diff --git "a/perplexity25/3491058.out" "b/perplexity25/3491058.out" new file mode 100644--- /dev/null +++ "b/perplexity25/3491058.out" @@ -0,0 +1,40510 @@ +Model parameters: d_model 2560 ffw_size 10240 kv_size 128 n_heads 20 n_layers 34 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 2 --pipeline-model-parallel-size 1 --num-layers 34 --hidden-size 2560 --num-attention-heads 20 --kv-channels 128 --ffn-hidden-size 10240 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 2 --global-batch-size 1024 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-4b284b84bperplexity25val --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 1000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_4b284b84bperplexity25val --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-4b2-84b-c4-perplexity/perplexity25 --load lm1-4b2-84b-c4-perplexity/perplexity25 --train-weighted-split-paths-path train1b5.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --deepspeed --deepspeed_config ds_configs/3491058.json --zero-stage 0 +START 3491058: Wed 10 May 2023 12:33:30 PM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 46.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 38.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 43.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 41.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 48.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 41.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 38.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 43.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 49.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 40.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 44.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 43.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 35.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 44.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 40.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 38.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 43.0c 80.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 44.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 37.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 40.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 40.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 39.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 43.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 38.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 48.0c 101.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 41.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 41.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 39.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 42.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 45.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 38.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 40.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 48.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 39.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 40.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 50.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 35.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 48.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 40.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 39.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 38.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 39.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 38.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 45.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 49.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== +30: Launching on nid005683 (30/32), master nid005048 port 9999, GPUs 8, CUDA: True + 8: Launching on nid005056 (8/32), master nid005048 port 9999, GPUs 8, CUDA: True +20: Launching on nid005673 (20/32), master nid005048 port 9999, GPUs 8, CUDA: True + 9: Launching on nid005057 (9/32), master nid005048 port 9999, GPUs 8, CUDA: True +26: Launching on nid005679 (26/32), master nid005048 port 9999, GPUs 8, CUDA: True + 1: Launching on nid005049 (1/32), master nid005048 port 9999, GPUs 8, CUDA: True + 3: Launching on nid005051 (3/32), master nid005048 port 9999, GPUs 8, CUDA: True +21: Launching on nid005674 (21/32), master nid005048 port 9999, GPUs 8, CUDA: True +31: Launching on nid005684 (31/32), master nid005048 port 9999, GPUs 8, CUDA: True +12: Launching on nid005060 (12/32), master nid005048 port 9999, GPUs 8, CUDA: True +11: Launching on nid005059 (11/32), master nid005048 port 9999, GPUs 8, CUDA: True +19: Launching on nid005067 (19/32), master nid005048 port 9999, GPUs 8, CUDA: True +14: Launching on nid005062 (14/32), master nid005048 port 9999, GPUs 8, CUDA: True +22: Launching on nid005675 (22/32), master nid005048 port 9999, GPUs 8, CUDA: True + 0: Launching on nid005048 (0/32), master nid005048 port 9999, GPUs 8, CUDA: True +18: Launching on nid005066 (18/32), master nid005048 port 9999, GPUs 8, CUDA: True +13: Launching on nid005061 (13/32), master nid005048 port 9999, GPUs 8, CUDA: True +25: Launching on nid005678 (25/32), master nid005048 port 9999, GPUs 8, CUDA: True +24: Launching on nid005677 (24/32), master nid005048 port 9999, GPUs 8, CUDA: True +10: Launching on nid005058 (10/32), master nid005048 port 9999, GPUs 8, CUDA: True + 2: Launching on nid005050 (2/32), master nid005048 port 9999, GPUs 8, CUDA: True +28: Launching on nid005681 (28/32), master nid005048 port 9999, GPUs 8, CUDA: True +15: Launching on nid005063 (15/32), master nid005048 port 9999, GPUs 8, CUDA: True + 7: Launching on nid005055 (7/32), master nid005048 port 9999, GPUs 8, CUDA: True +29: Launching on nid005682 (29/32), master nid005048 port 9999, GPUs 8, CUDA: True + 6: Launching on nid005054 (6/32), master nid005048 port 9999, GPUs 8, CUDA: True + 4: Launching on nid005052 (4/32), master nid005048 port 9999, GPUs 8, CUDA: True +17: Launching on nid005065 (17/32), master nid005048 port 9999, GPUs 8, CUDA: True +16: Launching on nid005064 (16/32), master nid005048 port 9999, GPUs 8, CUDA: True +27: Launching on nid005680 (27/32), master nid005048 port 9999, GPUs 8, CUDA: True +23: Launching on nid005676 (23/32), master nid005048 port 9999, GPUs 8, CUDA: True + 5: Launching on nid005053 (5/32), master nid005048 port 9999, GPUs 8, CUDA: True + 0: using world size: 256, data-parallel-size: 128, tensor-model-parallel size: 2, pipeline-model-parallel size: 1 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 128 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3491058.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 10240 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 1024 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 2560 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-4b284b84bperplexity25val + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-4b2-84b-c4-perplexity/perplexity25 + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 2 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 20 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 34 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 2 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 1 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-4b2-84b-c4-perplexity/perplexity25 + 0: save_interval ................................... 1000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 2 + 0: tensorboard_dir ................................. tensorboard_4b284b84bperplexity25val + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 2 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 256 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 4 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 175 dummy tokens (new size: 50432) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-05-10 12:36:51,927] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl +31: > setting tensorboard ... + 0: > initializing tensor model parallel with size 2 + 0: > initializing pipeline model parallel with size 1 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.100 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 87 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 63 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: [1/1] c++ layer_norm_cuda.o layer_norm_hip_kernel.cuda.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o fused_mix_prec_layer_norm_cuda.so + 0: >>> done with compiling and loading fused kernels. Compilation time: 19.604 seconds + 0: time to initialize megatron (seconds): 80.147 + 0: [after megatron is initialized] datetime: 2023-05-10 12:37:20 + 0: building GPT model ... + 0: [2023-05-10 12:37:20,326] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-05-10 12:37:20,327] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-05-10 12:37:20,327] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.96 GB, percent = 7.7% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=0, model=1): 1, ProcessCoord(pipe=0, data=1, model=0): 2, ProcessCoord(pipe=0, data=1, model=1): 3, ProcessCoord(pipe=0, data=2, model=0): 4, ProcessCoord(pipe=0, data=2, model=1): 5, ProcessCoord(pipe=0, data=3, model=0): 6, ProcessCoord(pipe=0, data=3, model=1): 7, ProcessCoord(pipe=0, data=4, model=0): 8, ProcessCoord(pipe=0, data=4, model=1): 9, ProcessCoord(pipe=0, data=5, model=0): 10, ProcessCoord(pipe=0, data=5, model=1): 11, ProcessCoord(pipe=0, data=6, model=0): 12, ProcessCoord(pipe=0, data=6, model=1): 13, ProcessCoord(pipe=0, data=7, model=0): 14, ProcessCoord(pipe=0, data=7, model=1): 15, ProcessCoord(pipe=0, data=8, model=0): 16, ProcessCoord(pipe=0, data=8, model=1): 17, ProcessCoord(pipe=0, data=9, model=0): 18, ProcessCoord(pipe=0, data=9, model=1): 19, ProcessCoord(pipe=0, data=10, model=0): 20, ProcessCoord(pipe=0, data=10, model=1): 21, ProcessCoord(pipe=0, data=11, model=0): 22, ProcessCoord(pipe=0, data + 0: =11, model=1): 23, ProcessCoord(pipe=0, data=12, model=0): 24, ProcessCoord(pipe=0, data=12, model=1): 25, ProcessCoord(pipe=0, data=13, model=0): 26, ProcessCoord(pipe=0, data=13, model=1): 27, ProcessCoord(pipe=0, data=14, model=0): 28, ProcessCoord(pipe=0, data=14, model=1): 29, ProcessCoord(pipe=0, data=15, model=0): 30, ProcessCoord(pipe=0, data=15, model=1): 31, ProcessCoord(pipe=0, data=16, model=0): 32, ProcessCoord(pipe=0, data=16, model=1): 33, ProcessCoord(pipe=0, data=17, model=0): 34, ProcessCoord(pipe=0, data=17, model=1): 35, ProcessCoord(pipe=0, data=18, model=0): 36, ProcessCoord(pipe=0, data=18, model=1): 37, ProcessCoord(pipe=0, data=19, model=0): 38, ProcessCoord(pipe=0, data=19, model=1): 39, ProcessCoord(pipe=0, data=20, model=0): 40, ProcessCoord(pipe=0, data=20, model=1): 41, ProcessCoord(pipe=0, data=21, model=0): 42, ProcessCoord(pipe=0, data=21, model=1): 43, ProcessCoord(pipe=0, data=22, model=0): 44, ProcessCoord(pipe=0, data=22, model=1): 45, ProcessCoord(pipe=0, data=23, model=0 + 0: ): 46, ProcessCoord(pipe=0, data=23, model=1): 47, ProcessCoord(pipe=0, data=24, model=0): 48, ProcessCoord(pipe=0, data=24, model=1): 49, ProcessCoord(pipe=0, data=25, model=0): 50, ProcessCoord(pipe=0, data=25, model=1): 51, ProcessCoord(pipe=0, data=26, model=0): 52, ProcessCoord(pipe=0, data=26, model=1): 53, ProcessCoord(pipe=0, data=27, model=0): 54, ProcessCoord(pipe=0, data=27, model=1): 55, ProcessCoord(pipe=0, data=28, model=0): 56, ProcessCoord(pipe=0, data=28, model=1): 57, ProcessCoord(pipe=0, data=29, model=0): 58, ProcessCoord(pipe=0, data=29, model=1): 59, ProcessCoord(pipe=0, data=30, model=0): 60, ProcessCoord(pipe=0, data=30, model=1): 61, ProcessCoord(pipe=0, data=31, model=0): 62, ProcessCoord(pipe=0, data=31, model=1): 63, ProcessCoord(pipe=0, data=32, model=0): 64, ProcessCoord(pipe=0, data=32, model=1): 65, ProcessCoord(pipe=0, data=33, model=0): 66, ProcessCoord(pipe=0, data=33, model=1): 67, ProcessCoord(pipe=0, data=34, model=0): 68, ProcessCoord(pipe=0, data=34, model=1): 69, Proce + 0: ssCoord(pipe=0, data=35, model=0): 70, ProcessCoord(pipe=0, data=35, model=1): 71, ProcessCoord(pipe=0, data=36, model=0): 72, ProcessCoord(pipe=0, data=36, model=1): 73, ProcessCoord(pipe=0, data=37, model=0): 74, ProcessCoord(pipe=0, data=37, model=1): 75, ProcessCoord(pipe=0, data=38, model=0): 76, ProcessCoord(pipe=0, data=38, model=1): 77, ProcessCoord(pipe=0, data=39, model=0): 78, ProcessCoord(pipe=0, data=39, model=1): 79, ProcessCoord(pipe=0, data=40, model=0): 80, ProcessCoord(pipe=0, data=40, model=1): 81, ProcessCoord(pipe=0, data=41, model=0): 82, ProcessCoord(pipe=0, data=41, model=1): 83, ProcessCoord(pipe=0, data=42, model=0): 84, ProcessCoord(pipe=0, data=42, model=1): 85, ProcessCoord(pipe=0, data=43, model=0): 86, ProcessCoord(pipe=0, data=43, model=1): 87, ProcessCoord(pipe=0, data=44, model=0): 88, ProcessCoord(pipe=0, data=44, model=1): 89, ProcessCoord(pipe=0, data=45, model=0): 90, ProcessCoord(pipe=0, data=45, model=1): 91, ProcessCoord(pipe=0, data=46, model=0): 92, ProcessCoord(pipe + 0: =0, data=46, model=1): 93, ProcessCoord(pipe=0, data=47, model=0): 94, ProcessCoord(pipe=0, data=47, model=1): 95, ProcessCoord(pipe=0, data=48, model=0): 96, ProcessCoord(pipe=0, data=48, model=1): 97, ProcessCoord(pipe=0, data=49, model=0): 98, ProcessCoord(pipe=0, data=49, model=1): 99, ProcessCoord(pipe=0, data=50, model=0): 100, ProcessCoord(pipe=0, data=50, model=1): 101, ProcessCoord(pipe=0, data=51, model=0): 102, ProcessCoord(pipe=0, data=51, model=1): 103, ProcessCoord(pipe=0, data=52, model=0): 104, ProcessCoord(pipe=0, data=52, model=1): 105, ProcessCoord(pipe=0, data=53, model=0): 106, ProcessCoord(pipe=0, data=53, model=1): 107, ProcessCoord(pipe=0, data=54, model=0): 108, ProcessCoord(pipe=0, data=54, model=1): 109, ProcessCoord(pipe=0, data=55, model=0): 110, ProcessCoord(pipe=0, data=55, model=1): 111, ProcessCoord(pipe=0, data=56, model=0): 112, ProcessCoord(pipe=0, data=56, model=1): 113, ProcessCoord(pipe=0, data=57, model=0): 114, ProcessCoord(pipe=0, data=57, model=1): 115, ProcessCoord( + 0: pipe=0, data=58, model=0): 116, ProcessCoord(pipe=0, data=58, model=1): 117, ProcessCoord(pipe=0, data=59, model=0): 118, ProcessCoord(pipe=0, data=59, model=1): 119, ProcessCoord(pipe=0, data=60, model=0): 120, ProcessCoord(pipe=0, data=60, model=1): 121, ProcessCoord(pipe=0, data=61, model=0): 122, ProcessCoord(pipe=0, data=61, model=1): 123, ProcessCoord(pipe=0, data=62, model=0): 124, ProcessCoord(pipe=0, data=62, model=1): 125, ProcessCoord(pipe=0, data=63, model=0): 126, ProcessCoord(pipe=0, data=63, model=1): 127, ProcessCoord(pipe=0, data=64, model=0): 128, ProcessCoord(pipe=0, data=64, model=1): 129, ProcessCoord(pipe=0, data=65, model=0): 130, ProcessCoord(pipe=0, data=65, model=1): 131, ProcessCoord(pipe=0, data=66, model=0): 132, ProcessCoord(pipe=0, data=66, model=1): 133, ProcessCoord(pipe=0, data=67, model=0): 134, ProcessCoord(pipe=0, data=67, model=1): 135, ProcessCoord(pipe=0, data=68, model=0): 136, ProcessCoord(pipe=0, data=68, model=1): 137, ProcessCoord(pipe=0, data=69, model=0): 138, Pr + 0: ocessCoord(pipe=0, data=69, model=1): 139, ProcessCoord(pipe=0, data=70, model=0): 140, ProcessCoord(pipe=0, data=70, model=1): 141, ProcessCoord(pipe=0, data=71, model=0): 142, ProcessCoord(pipe=0, data=71, model=1): 143, ProcessCoord(pipe=0, data=72, model=0): 144, ProcessCoord(pipe=0, data=72, model=1): 145, ProcessCoord(pipe=0, data=73, model=0): 146, ProcessCoord(pipe=0, data=73, model=1): 147, ProcessCoord(pipe=0, data=74, model=0): 148, ProcessCoord(pipe=0, data=74, model=1): 149, ProcessCoord(pipe=0, data=75, model=0): 150, ProcessCoord(pipe=0, data=75, model=1): 151, ProcessCoord(pipe=0, data=76, model=0): 152, ProcessCoord(pipe=0, data=76, model=1): 153, ProcessCoord(pipe=0, data=77, model=0): 154, ProcessCoord(pipe=0, data=77, model=1): 155, ProcessCoord(pipe=0, data=78, model=0): 156, ProcessCoord(pipe=0, data=78, model=1): 157, ProcessCoord(pipe=0, data=79, model=0): 158, ProcessCoord(pipe=0, data=79, model=1): 159, ProcessCoord(pipe=0, data=80, model=0): 160, ProcessCoord(pipe=0, data=80, model= + 0: 1): 161, ProcessCoord(pipe=0, data=81, model=0): 162, ProcessCoord(pipe=0, data=81, model=1): 163, ProcessCoord(pipe=0, data=82, model=0): 164, ProcessCoord(pipe=0, data=82, model=1): 165, ProcessCoord(pipe=0, data=83, model=0): 166, ProcessCoord(pipe=0, data=83, model=1): 167, ProcessCoord(pipe=0, data=84, model=0): 168, ProcessCoord(pipe=0, data=84, model=1): 169, ProcessCoord(pipe=0, data=85, model=0): 170, ProcessCoord(pipe=0, data=85, model=1): 171, ProcessCoord(pipe=0, data=86, model=0): 172, ProcessCoord(pipe=0, data=86, model=1): 173, ProcessCoord(pipe=0, data=87, model=0): 174, ProcessCoord(pipe=0, data=87, model=1): 175, ProcessCoord(pipe=0, data=88, model=0): 176, ProcessCoord(pipe=0, data=88, model=1): 177, ProcessCoord(pipe=0, data=89, model=0): 178, ProcessCoord(pipe=0, data=89, model=1): 179, ProcessCoord(pipe=0, data=90, model=0): 180, ProcessCoord(pipe=0, data=90, model=1): 181, ProcessCoord(pipe=0, data=91, model=0): 182, ProcessCoord(pipe=0, data=91, model=1): 183, ProcessCoord(pipe=0, data + 0: =92, model=0): 184, ProcessCoord(pipe=0, data=92, model=1): 185, ProcessCoord(pipe=0, data=93, model=0): 186, ProcessCoord(pipe=0, data=93, model=1): 187, ProcessCoord(pipe=0, data=94, model=0): 188, ProcessCoord(pipe=0, data=94, model=1): 189, ProcessCoord(pipe=0, data=95, model=0): 190, ProcessCoord(pipe=0, data=95, model=1): 191, ProcessCoord(pipe=0, data=96, model=0): 192, ProcessCoord(pipe=0, data=96, model=1): 193, ProcessCoord(pipe=0, data=97, model=0): 194, ProcessCoord(pipe=0, data=97, model=1): 195, ProcessCoord(pipe=0, data=98, model=0): 196, ProcessCoord(pipe=0, data=98, model=1): 197, ProcessCoord(pipe=0, data=99, model=0): 198, ProcessCoord(pipe=0, data=99, model=1): 199, ProcessCoord(pipe=0, data=100, model=0): 200, ProcessCoord(pipe=0, data=100, model=1): 201, ProcessCoord(pipe=0, data=101, model=0): 202, ProcessCoord(pipe=0, data=101, model=1): 203, ProcessCoord(pipe=0, data=102, model=0): 204, ProcessCoord(pipe=0, data=102, model=1): 205, ProcessCoord(pipe=0, data=103, model=0): 206, Process + 0: Coord(pipe=0, data=103, model=1): 207, ProcessCoord(pipe=0, data=104, model=0): 208, ProcessCoord(pipe=0, data=104, model=1): 209, ProcessCoord(pipe=0, data=105, model=0): 210, ProcessCoord(pipe=0, data=105, model=1): 211, ProcessCoord(pipe=0, data=106, model=0): 212, ProcessCoord(pipe=0, data=106, model=1): 213, ProcessCoord(pipe=0, data=107, model=0): 214, ProcessCoord(pipe=0, data=107, model=1): 215, ProcessCoord(pipe=0, data=108, model=0): 216, ProcessCoord(pipe=0, data=108, model=1): 217, ProcessCoord(pipe=0, data=109, model=0): 218, ProcessCoord(pipe=0, data=109, model=1): 219, ProcessCoord(pipe=0, data=110, model=0): 220, ProcessCoord(pipe=0, data=110, model=1): 221, ProcessCoord(pipe=0, data=111, model=0): 222, ProcessCoord(pipe=0, data=111, model=1): 223, ProcessCoord(pipe=0, data=112, model=0): 224, ProcessCoord(pipe=0, data=112, model=1): 225, ProcessCoord(pipe=0, data=113, model=0): 226, ProcessCoord(pipe=0, data=113, model=1): 227, ProcessCoord(pipe=0, data=114, model=0): 228, ProcessCoord(pipe=0 + 0: , data=114, model=1): 229, ProcessCoord(pipe=0, data=115, model=0): 230, ProcessCoord(pipe=0, data=115, model=1): 231, ProcessCoord(pipe=0, data=116, model=0): 232, ProcessCoord(pipe=0, data=116, model=1): 233, ProcessCoord(pipe=0, data=117, model=0): 234, ProcessCoord(pipe=0, data=117, model=1): 235, ProcessCoord(pipe=0, data=118, model=0): 236, ProcessCoord(pipe=0, data=118, model=1): 237, ProcessCoord(pipe=0, data=119, model=0): 238, ProcessCoord(pipe=0, data=119, model=1): 239, ProcessCoord(pipe=0, data=120, model=0): 240, ProcessCoord(pipe=0, data=120, model=1): 241, ProcessCoord(pipe=0, data=121, model=0): 242, ProcessCoord(pipe=0, data=121, model=1): 243, ProcessCoord(pipe=0, data=122, model=0): 244, ProcessCoord(pipe=0, data=122, model=1): 245, ProcessCoord(pipe=0, data=123, model=0): 246, ProcessCoord(pipe=0, data=123, model=1): 247, ProcessCoord(pipe=0, data=124, model=0): 248, ProcessCoord(pipe=0, data=124, model=1): 249, ProcessCoord(pipe=0, data=125, model=0): 250, ProcessCoord(pipe=0, data=125, + 0: model=1): 251, ProcessCoord(pipe=0, data=126, model=0): 252, ProcessCoord(pipe=0, data=126, model=1): 253, ProcessCoord(pipe=0, data=127, model=0): 254, ProcessCoord(pipe=0, data=127, model=1): 255} + 0: [2023-05-10 12:37:25,795] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=41 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: ParallelTransformerLayerPipe + 0: 32: ParallelTransformerLayerPipe + 0: 33: ParallelTransformerLayerPipe + 0: 34: ParallelTransformerLayerPipe + 0: 35: ParallelTransformerLayerPipe + 0: 36: ParallelTransformerLayerPipe + 0: 37: undo + 0: 38: MixedFusedLayerNorm + 0: 39: EmbeddingPipe + 0: 40: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-05-10 12:37:26,715] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-05-10 12:37:26,716] [INFO] [utils.py:828:see_memory_usage] MA 2.7 GB Max_MA 2.7 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:37:26,716] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.16 GB, percent = 7.8% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-05-10 12:37:26,719] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-05-10 12:37:32,546] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-05-10 12:37:32,546] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-05-10 12:37:32,546] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-05-10 12:37:32,565] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-05-10 12:37:32,565] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-05-10 12:37:32,694] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-05-10 12:37:32,695] [INFO] [utils.py:828:see_memory_usage] MA 2.69 GB Max_MA 2.71 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:37:32,695] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.86 GB, percent = 7.9% + 1: ninja: no work to do. +25: Time to load utils op: 0.332639217376709 seconds +25: Time to load utils op: 0.33264899253845215 seconds +25: Time to load utils op: 0.33266448974609375 seconds +25: Time to load utils op: 0.33266639709472656 seconds +11: Time to load utils op: 0.36772942543029785 secondsTime to load utils op: 0.36772871017456055 seconds +11: +11: Time to load utils op: 0.3677406311035156 seconds +11: Time to load utils op: 0.3677480220794678 seconds +29: Time to load utils op: 0.35756444931030273 secondsTime to load utils op: 0.35756468772888184 secondsTime to load utils op: 0.35756635665893555 seconds +29: +29: +12: Time to load utils op: 0.3425307273864746 seconds +12: Time to load utils op: 0.34253764152526855 seconds +12: Time to load utils op: 0.3425478935241699 seconds + 1: Time to load utils op: 0.37685084342956543 secondsTime to load utils op: 0.37716078758239746 seconds + 1: + 1: Time to load utils op: 0.3769822120666504 seconds +30: Time to load utils op: 0.35715460777282715 secondsTime to load utils op: 0.3571584224700928 seconds +30: +30: Time to load utils op: 0.3571736812591553 seconds +30: Time to load utils op: 0.35718488693237305 seconds +28: Time to load utils op: 0.3609592914581299 seconds +28: Time to load utils op: 0.36142730712890625 seconds +28: Time to load utils op: 0.3607969284057617 secondsTime to load utils op: 0.36095762252807617 seconds +28: +23: Time to load utils op: 0.3593423366546631 secondsTime to load utils op: 0.35933971405029297 seconds +23: +23: Time to load utils op: 0.3593568801879883 seconds +23: Time to load utils op: 0.3593268394470215 seconds +27: Time to load utils op: 0.3591182231903076 seconds +27: Time to load utils op: 0.3591334819793701 secondsTime to load utils op: 0.3591282367706299 seconds +27: +27: Time to load utils op: 0.35292983055114746 seconds +29: Time to load utils op: 0.35757946968078613 seconds +15: Time to load utils op: 0.36794376373291016 secondsTime to load utils op: 0.36820459365844727 secondsTime to load utils op: 0.3678765296936035 seconds +15: +15: +15: Time to load utils op: 0.36810851097106934 seconds +12: Time to load utils op: 0.33321142196655273 seconds +18: Time to load utils op: 0.36737990379333496 seconds +18: Time to load utils op: 0.36780786514282227 seconds +18: Time to load utils op: 0.36739110946655273 seconds +18: Time to load utils op: 0.3677060604095459 seconds + 1: Time to load utils op: 0.3770265579223633 seconds +21: Time to load utils op: 0.36220383644104004 secondsTime to load utils op: 0.36220574378967285 seconds +21: +21: Time to load utils op: 0.3622133731842041 seconds +21: Time to load utils op: 0.36222100257873535 seconds +19: Time to load utils op: 0.36740922927856445 seconds +19: Time to load utils op: 0.36672306060791016 secondsTime to load utils op: 0.3655378818511963 seconds +19: Time to load utils op: 0.36680054664611816 seconds +19: + 7: Time to load utils op: 0.37416958808898926 secondsTime to load utils op: 0.3736860752105713 seconds + 7: + 7: Time to load utils op: 0.3740861415863037 seconds + 9: Time to load utils op: 0.37241649627685547 secondsTime to load utils op: 0.37279438972473145 seconds + 9: + 9: Time to load utils op: 0.37245893478393555 seconds +26: Time to load utils op: 0.36318445205688477 seconds +26: Time to load utils op: 0.3641805648803711 seconds +26: Time to load utils op: 0.36403346061706543 seconds +31: Time to load utils op: 0.36130237579345703 secondsTime to load utils op: 0.36101627349853516 seconds +31: +31: Time to load utils op: 0.3607017993927002 seconds + 5: Time to load utils op: 0.3743577003479004 secondsTime to load utils op: 0.3744802474975586 seconds + 5: + 5: Time to load utils op: 0.3743727207183838 seconds + 5: Time to load utils op: 0.3743295669555664 seconds + 9: Time to load utils op: 0.37178874015808105 seconds + 7: Time to load utils op: 0.37357211112976074 seconds +14: Time to load utils op: 0.37032032012939453 secondsTime to load utils op: 0.37055015563964844 seconds +14: +14: Time to load utils op: 0.36988115310668945 secondsTime to load utils op: 0.37076544761657715 seconds +14: + 3: Time to load utils op: 0.3741462230682373 seconds + 3: Time to load utils op: 0.37648487091064453 seconds +22: Time to load utils op: 0.3610038757324219 secondsTime to load utils op: 0.36099982261657715 seconds +22: +22: Time to load utils op: 0.3610093593597412 seconds +22: Time to load utils op: 0.36102986335754395 seconds +24: Time to load utils op: 0.360579252243042 seconds +24: Time to load utils op: 0.3605978488922119 seconds +26: Time to load utils op: 0.3642709255218506 seconds +31: Time to load utils op: 0.36032819747924805 seconds +13: Time to load utils op: 0.3670170307159424 secondsTime to load utils op: 0.3670179843902588 seconds +13: +13: Time to load utils op: 0.36702752113342285 seconds + 6: Time to load utils op: 0.370405912399292 seconds + 6: Time to load utils op: 0.3704216480255127 seconds + 6: Time to load utils op: 0.3704204559326172 seconds + 3: Time to load utils op: 0.3760664463043213 secondsTime to load utils op: 0.37711167335510254 seconds + 3: +24: Time to load utils op: 0.3606107234954834 secondsTime to load utils op: 0.36061835289001465 seconds +24: +17: Time to load utils op: 0.36443376541137695 seconds +17: Time to load utils op: 0.3644418716430664 secondsTime to load utils op: 0.36444735527038574 seconds +17: +17: Time to load utils op: 0.3644552230834961 seconds + 0: Time to load utils op: 0.3778562545776367 seconds + 0: Time to load utils op: 0.2663865089416504 seconds +20: Time to load utils op: 0.3664877414703369 secondsTime to load utils op: 0.36602067947387695 seconds +20: +20: Time to load utils op: 0.36640357971191406 seconds + 6: Time to load utils op: 0.37043237686157227 seconds +16: Time to load utils op: 0.369464635848999 secondsTime to load utils op: 0.3695690631866455 seconds +16: +16: Time to load utils op: 0.36881089210510254 seconds +16: Time to load utils op: 0.3686816692352295 seconds + 0: Time to load utils op: 0.3777134418487549 seconds +13: Time to load utils op: 0.36702775955200195 seconds + 0: Time to load utils op: 0.37758779525756836 seconds + 2: Time to load utils op: 0.37691664695739746 secondsTime to load utils op: 0.3769693374633789 secondsTime to load utils op: 0.37746262550354004 seconds + 2: + 2: +20: Time to load utils op: 0.3660597801208496 seconds + 4: Time to load utils op: 0.371596097946167 seconds + 4: Time to load utils op: 0.3716120719909668 seconds + 4: Time to load utils op: 0.37160778045654297 secondsTime to load utils op: 0.3716132640838623 seconds + 4: +10: Time to load utils op: 0.3721930980682373 secondsTime to load utils op: 0.37270188331604004 seconds +10: +10: Time to load utils op: 0.37309837341308594 seconds + 8: Time to load utils op: 0.3701448440551758 seconds + 8: Time to load utils op: 0.37015843391418457 seconds + 8: Time to load utils op: 0.37016773223876953 seconds +10: Time to load utils op: 0.372683048248291 seconds + 2: Time to load utils op: 0.37642574310302734 seconds + 8: Time to load utils op: 0.3701791763305664 seconds + 0: [2023-05-10 12:37:33,079] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: [2023-05-10 12:37:33,079] [INFO] [utils.py:828:see_memory_usage] MA 2.69 GB Max_MA 2.69 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:37:33,079] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.86 GB, percent = 7.9% + 0: ninja: no work to do. + 0: Time to load utils op: 0.18898272514343262 seconds + 0: Time to load utils op: 0.20205450057983398 seconds + 1: Time to load utils op: 0.20298480987548828 seconds + 0: Time to load utils op: 0.2018449306488037 seconds + 1: Time to load utils op: 0.20227575302124023 seconds + 0: Time to load utils op: 0.2021491527557373 seconds + 1: Time to load utils op: 0.20249462127685547 secondsTime to load utils op: 0.20221376419067383 seconds + 1: + 2: Time to load utils op: 0.2027754783630371 seconds + 2: Time to load utils op: 0.2028944492340088 seconds + 2: Time to load utils op: 0.20226716995239258 seconds + 3: Time to load utils op: 0.20296931266784668 seconds + 3: Time to load utils op: 0.20233726501464844 seconds + 3: Time to load utils op: 0.20274758338928223 seconds + 3: Time to load utils op: 0.20252108573913574 seconds + 4: Time to load utils op: 0.20401334762573242 seconds + 4: Time to load utils op: 0.20414495468139648 seconds + 4: Time to load utils op: 0.20441889762878418 secondsTime to load utils op: 0.20424580574035645 seconds + 4: + 7: Time to load utils op: 0.20404410362243652 seconds + 7: Time to load utils op: 0.20308542251586914 seconds + 7: Time to load utils op: 0.2043914794921875 seconds + 7: Time to load utils op: 0.20435857772827148 seconds + 2: Time to load utils op: 0.20279741287231445 seconds + 6: Time to load utils op: 0.20439410209655762 seconds + 6: Time to load utils op: 0.20415520668029785 seconds + 5: Time to load utils op: 0.20480990409851074 seconds + 5: Time to load utils op: 0.2048346996307373 secondsTime to load utils op: 0.2045440673828125 seconds + 5: + 9: Time to load utils op: 0.2031106948852539 seconds + 9: Time to load utils op: 0.20396637916564941 seconds + 9: Time to load utils op: 0.20410561561584473 seconds + 6: Time to load utils op: 0.2045755386352539 seconds + 6: Time to load utils op: 0.20470261573791504 seconds + 9: Time to load utils op: 0.20426011085510254 seconds + 5: Time to load utils op: 0.20515036582946777 seconds +10: Time to load utils op: 0.2041006088256836 seconds +10: Time to load utils op: 0.20406246185302734 seconds + 8: Time to load utils op: 0.20382475852966309 seconds +10: Time to load utils op: 0.20363640785217285 seconds + 8: Time to load utils op: 0.20377612113952637 seconds + 8: Time to load utils op: 0.20392608642578125 seconds +10: Time to load utils op: 0.20490670204162598 seconds + 8: Time to load utils op: 0.20411133766174316 seconds +11: Time to load utils op: 0.20328307151794434 seconds +11: Time to load utils op: 0.2044510841369629 seconds +11: Time to load utils op: 0.20395612716674805 seconds +11: Time to load utils op: 0.2042701244354248 seconds +14: Time to load utils op: 0.20362639427185059 seconds +16: Time to load utils op: 0.20249176025390625 seconds +14: Time to load utils op: 0.20296263694763184 seconds +14: Time to load utils op: 0.2040233612060547 seconds +16: Time to load utils op: 0.20226192474365234 seconds +16: Time to load utils op: 0.20275449752807617 seconds +16: Time to load utils op: 0.2031092643737793 seconds +14: Time to load utils op: 0.20307588577270508 seconds +15: Time to load utils op: 0.20399689674377441 secondsTime to load utils op: 0.20456767082214355 seconds +15: +15: Time to load utils op: 0.2038426399230957 seconds +13: Time to load utils op: 0.2038733959197998 seconds +15: Time to load utils op: 0.20461773872375488 seconds +13: Time to load utils op: 0.20400571823120117 seconds +13: Time to load utils op: 0.20414376258850098 seconds +13: Time to load utils op: 0.20387005805969238 seconds +17: Time to load utils op: 0.20360350608825684 seconds +18: Time to load utils op: 0.20270395278930664 seconds +19: Time to load utils op: 0.2037639617919922 seconds +18: Time to load utils op: 0.20334863662719727 seconds +17: Time to load utils op: 0.20391416549682617 seconds +18: Time to load utils op: 0.20263957977294922 seconds +19: Time to load utils op: 0.20389604568481445 seconds +18: Time to load utils op: 0.20372867584228516 seconds +17: Time to load utils op: 0.20404911041259766 seconds +19: Time to load utils op: 0.2035999298095703 seconds +17: Time to load utils op: 0.20424389839172363 seconds +19: Time to load utils op: 0.20331883430480957 seconds +20: Time to load utils op: 0.20355653762817383 seconds +20: Time to load utils op: 0.20347237586975098 seconds +20: Time to load utils op: 0.2033705711364746 seconds +21: Time to load utils op: 0.2033395767211914 seconds +20: Time to load utils op: 0.20356392860412598 seconds +21: Time to load utils op: 0.20355892181396484 seconds +21: Time to load utils op: 0.20367741584777832 seconds +21: Time to load utils op: 0.20368528366088867 seconds +23: Time to load utils op: 0.2035832405090332 seconds +23: Time to load utils op: 0.20292282104492188 seconds +23: Time to load utils op: 0.20369362831115723 seconds +27: Time to load utils op: 0.20360898971557617 seconds +23: Time to load utils op: 0.2032155990600586 seconds +26: Time to load utils op: 0.20335006713867188 seconds +27: Time to load utils op: 0.203599214553833 seconds +24: Time to load utils op: 0.204329252243042 seconds +26: Time to load utils op: 0.2040543556213379 seconds +27: Time to load utils op: 0.20328307151794434 seconds +22: Time to load utils op: 0.20468688011169434 seconds +22: Time to load utils op: 0.20451045036315918 secondsTime to load utils op: 0.2046370506286621 seconds +22: +28: Time to load utils op: 0.2027754783630371 seconds +28: Time to load utils op: 0.20285749435424805 seconds +26: Time to load utils op: 0.20332765579223633 secondsTime to load utils op: 0.20302677154541016 seconds +26: +24: Time to load utils op: 0.2043747901916504 seconds +27: Time to load utils op: 0.20319724082946777 seconds +22: Time to load utils op: 0.2046675682067871 seconds +24: Time to load utils op: 0.2046375274658203 seconds +28: Time to load utils op: 0.2025928497314453 seconds +28: Time to load utils op: 0.2037639617919922 seconds +24: Time to load utils op: 0.2045581340789795 seconds +25: Time to load utils op: 0.20335006713867188 seconds +25: Time to load utils op: 0.20357799530029297 seconds +25: Time to load utils op: 0.20336675643920898 seconds +25: Time to load utils op: 0.2033534049987793 seconds +31: Time to load utils op: 0.20248079299926758 seconds +31: Time to load utils op: 0.20327448844909668 seconds +31: Time to load utils op: 0.2026991844177246 seconds +30: Time to load utils op: 0.2027895450592041 seconds +30: Time to load utils op: 0.20264363288879395 seconds +30: Time to load utils op: 0.20273113250732422 seconds +31: Time to load utils op: 0.20188188552856445 seconds +30: Time to load utils op: 0.20287466049194336 seconds +29: Time to load utils op: 0.2037065029144287 seconds +12: Time to load utils op: 0.20322203636169434 seconds +29: Time to load utils op: 0.20403051376342773 seconds +29: Time to load utils op: 0.2040705680847168 seconds +29: Time to load utils op: 0.20420289039611816 seconds +12: Time to load utils op: 0.20278525352478027 seconds +12: Time to load utils op: 0.20235013961791992 seconds +12: Time to load utils op: 0.2029123306274414 seconds +10: Time to load utils op: 0.0008211135864257812 seconds +10: Time to load utils op: 0.0007586479187011719 secondsTime to load utils op: 0.0007367134094238281 seconds +10: +10: Time to load utils op: 0.0007305145263671875 seconds +10: Time to load utils op: 0.000774383544921875 seconds +10: Time to load utils op: 0.0009572505950927734 seconds +10: Time to load utils op: 0.00087738037109375 seconds +10: Time to load utils op: 0.0008537769317626953 seconds + 0: Time to load utils op: 0.0005731582641601562 seconds + 0: Time to load utils op: 0.0005161762237548828 secondsTime to load utils op: 0.0004992485046386719 secondsTime to load utils op: 0.00049591064453125 seconds + 0: + 0: + 0: Time to load utils op: 0.00048041343688964844 seconds + 0: Time to load utils op: 0.0006129741668701172 seconds + 0: Time to load utils op: 0.0005295276641845703 seconds +16: Time to load utils op: 0.00054931640625 seconds +16: Time to load utils op: 0.0006520748138427734 secondsTime to load utils op: 0.0006704330444335938 seconds +16: + 2: Time to load utils op: 0.0007801055908203125 secondsTime to load utils op: 0.0006792545318603516 seconds + 2: + 9: Time to load utils op: 0.0008702278137207031 seconds + 2: Time to load utils op: 0.0008437633514404297 seconds + 3: Time to load utils op: 0.0006854534149169922 seconds +12: Time to load utils op: 0.0007746219635009766 seconds +16: Time to load utils op: 0.0005981922149658203 seconds + 9: Time to load utils op: 0.0008580684661865234 seconds + 2: Time to load utils op: 0.0007486343383789062 seconds +18: Time to load utils op: 0.0006632804870605469 seconds + 3: Time to load utils op: 0.0007574558258056641 seconds + 3: Time to load utils op: 0.0009548664093017578 secondsTime to load utils op: 0.0008087158203125 seconds + 3: + 3: Time to load utils op: 0.000835418701171875 seconds + 3: Time to load utils op: 0.0007872581481933594 seconds + 3: Time to load utils op: 0.0007393360137939453 seconds +13: Time to load utils op: 0.0007891654968261719 seconds +24: Time to load utils op: 0.0009953975677490234 seconds +31: Time to load utils op: 0.0008139610290527344 seconds +12: Time to load utils op: 0.00042247772216796875 secondsTime to load utils op: 0.0007646083831787109 seconds +12: +27: Time to load utils op: 0.0006084442138671875 seconds +16: Time to load utils op: 0.0006182193756103516 seconds + 3: Time to load utils op: 0.0008339881896972656 seconds + 9: Time to load utils op: 0.0009343624114990234 seconds + 2: Time to load utils op: 0.0010099411010742188 seconds +31: Time to load utils op: 0.0010352134704589844 secondsTime to load utils op: 0.0009367465972900391 seconds +31: + 9: Time to load utils op: 0.0008533000946044922 seconds +13: Time to load utils op: 0.0007195472717285156 seconds +30: Time to load utils op: 0.0008029937744140625 seconds +26: Time to load utils op: 0.0009095668792724609 seconds +12: Time to load utils op: 0.0003979206085205078 seconds +18: Time to load utils op: 0.0007193088531494141 seconds +16: Time to load utils op: 0.0006058216094970703 seconds + 1: Time to load utils op: 0.0007882118225097656 seconds + 9: Time to load utils op: 0.0009167194366455078 seconds + 9: Time to load utils op: 0.0010027885437011719 seconds +30: Time to load utils op: 0.0007026195526123047 seconds +26: Time to load utils op: 0.0009129047393798828 seconds + 2: Time to load utils op: 0.0010902881622314453 seconds + 2: Time to load utils op: 0.0011434555053710938 seconds +15: Time to load utils op: 0.0008249282836914062 seconds +30: Time to load utils op: 0.0007233619689941406 seconds +12: Time to load utils op: 0.0003910064697265625 seconds +16: Time to load utils op: 0.0006577968597412109 seconds + 1: Time to load utils op: 0.0010051727294921875 secondsTime to load utils op: 0.0008521080017089844 seconds + 1: + 1: Time to load utils op: 0.0008223056793212891 seconds + 1: Time to load utils op: 0.0009522438049316406 seconds + 1: Time to load utils op: 0.0008785724639892578 seconds + 1: Time to load utils op: 0.0010075569152832031 seconds + 9: Time to load utils op: 0.0011959075927734375 seconds + 2: Time to load utils op: 0.0010209083557128906 seconds + 8: Time to load utils op: 0.0007240772247314453 seconds +30: Time to load utils op: 0.0007505416870117188 seconds +26: Time to load utils op: 0.0009539127349853516 seconds + 5: Time to load utils op: 0.0007140636444091797 secondsTime to load utils op: 0.0006058216094970703 seconds + 5: +18: Time to load utils op: 0.0008947849273681641 seconds +23: Time to load utils op: 0.0009071826934814453 secondsTime to load utils op: 0.000919342041015625 seconds +23: +27: Time to load utils op: 0.0007684230804443359 secondsTime to load utils op: 0.0008225440979003906 secondsTime to load utils op: 0.0008270740509033203 seconds +27: +27: +16: Time to load utils op: 0.0006625652313232422 seconds + 9: Time to load utils op: 0.0011610984802246094 seconds +14: Time to load utils op: 0.0011506080627441406 seconds +14: Time to load utils op: 0.0011134147644042969 secondsTime to load utils op: 0.0010673999786376953 seconds +14: +14: Time to load utils op: 0.0010502338409423828 seconds +14: Time to load utils op: 0.0010716915130615234 seconds +22: Time to load utils op: 0.0008685588836669922 secondsTime to load utils op: 0.0009214878082275391 seconds +22: +31: Time to load utils op: 0.0008292198181152344 seconds +31: Time to load utils op: 0.0009789466857910156 seconds +12: Time to load utils op: 0.0004150867462158203 seconds + 8: Time to load utils op: 0.0007557868957519531 secondsTime to load utils op: 0.0007140636444091797 seconds + 8: +31: Time to load utils op: 0.0008158683776855469 seconds +12: Time to load utils op: 0.0007555484771728516 seconds + 7: Time to load utils op: 0.00101470947265625 seconds +27: Time to load utils op: 0.0008695125579833984 seconds +13: Time to load utils op: 0.0011734962463378906 seconds +19: Time to load utils op: 0.0008573532104492188 secondsTime to load utils op: 0.0009379386901855469 secondsTime to load utils op: 0.0010073184967041016 seconds +19: +19: +12: Time to load utils op: 0.0004010200500488281 seconds +18: Time to load utils op: 0.0010519027709960938 seconds +23: Time to load utils op: 0.0010833740234375 seconds +29: Time to load utils op: 0.000896453857421875 seconds +29: Time to load utils op: 0.0009160041809082031 seconds +20: Time to load utils op: 0.0009236335754394531 seconds +30: Time to load utils op: 0.0008714199066162109 secondsTime to load utils op: 0.000934600830078125 seconds +30: +26: Time to load utils op: 0.0010461807250976562 secondsTime to load utils op: 0.0011453628540039062 secondsTime to load utils op: 0.0011365413665771484 seconds +26: +26: +26: Time to load utils op: 0.0011801719665527344 seconds +26: Time to load utils op: 0.0011632442474365234 seconds + 5: Time to load utils op: 0.0007839202880859375 secondsTime to load utils op: 0.0007727146148681641 secondsTime to load utils op: 0.0008263587951660156 secondsTime to load utils op: 0.0007407665252685547 seconds + 5: + 5: + 5: +11: Time to load utils op: 0.000858306884765625 secondsTime to load utils op: 0.0008060932159423828 secondsTime to load utils op: 0.0008976459503173828 seconds +11: +11: +29: Time to load utils op: 0.0009465217590332031 seconds + 1: Time to load utils op: 0.0009660720825195312 seconds + 8: Time to load utils op: 0.0007951259613037109 seconds +14: Time to load utils op: 0.0013380050659179688 seconds +15: Time to load utils op: 0.00113677978515625 secondsTime to load utils op: 0.0011096000671386719 seconds +15: +15: Time to load utils op: 0.0011126995086669922 seconds +22: Time to load utils op: 0.001009225845336914 secondsTime to load utils op: 0.0010030269622802734 seconds +22: +22: Time to load utils op: 0.0010800361633300781 seconds +30: Time to load utils op: 0.0010254383087158203 seconds +28: Time to load utils op: 0.0009188652038574219 seconds +31: Time to load utils op: 0.0009379386901855469 seconds +11: Time to load utils op: 0.0009317398071289062 seconds +23: Time to load utils op: 0.0011491775512695312 seconds + 8: Time to load utils op: 0.00086212158203125 seconds +22: Time to load utils op: 0.001005411148071289 seconds +28: Time to load utils op: 0.0008955001831054688 secondsTime to load utils op: 0.0008990764617919922 seconds +28: +17: Time to load utils op: 0.0008766651153564453 seconds +18: Time to load utils op: 0.0011188983917236328 seconds +30: Time to load utils op: 0.0010957717895507812 seconds +31: Time to load utils op: 0.0011866092681884766 seconds +17: Time to load utils op: 0.0008842945098876953 seconds + 7: Time to load utils op: 0.00139617919921875 seconds +23: Time to load utils op: 0.001186370849609375 seconds +17: Time to load utils op: 0.0008826255798339844 seconds + 7: Time to load utils op: 0.0013415813446044922 seconds +14: Time to load utils op: 0.0015192031860351562 seconds +15: Time to load utils op: 0.0013756752014160156 seconds +18: Time to load utils op: 0.0014340877532958984 seconds +14: Time to load utils op: 0.0014171600341796875 seconds +15: Time to load utils op: 0.001314401626586914 seconds +22: Time to load utils op: 0.0013167858123779297 seconds +17: Time to load utils op: 0.0009953975677490234 seconds +23: Time to load utils op: 0.0014812946319580078 seconds +27: Time to load utils op: 0.0013434886932373047 seconds + 8: Time to load utils op: 0.0012769699096679688 seconds +21: Time to load utils op: 0.0014886856079101562 seconds +22: Time to load utils op: 0.0012674331665039062 seconds +19: Time to load utils op: 0.001371622085571289 secondsTime to load utils op: 0.0012924671173095703 secondsTime to load utils op: 0.0013592243194580078 seconds +19: +19: +28: Time to load utils op: 0.0013492107391357422 seconds + 5: Time to load utils op: 0.00128936767578125 seconds + 5: Time to load utils op: 0.0012791156768798828 seconds +11: Time to load utils op: 0.0013277530670166016 seconds +18: Time to load utils op: 0.0015101432800292969 seconds + 7: Time to load utils op: 0.0014958381652832031 seconds +21: Time to load utils op: 0.001477956771850586 seconds +20: Time to load utils op: 0.001255035400390625 seconds +19: Time to load utils op: 0.0013988018035888672 seconds + 7: Time to load utils op: 0.0014269351959228516 secondsTime to load utils op: 0.00147247314453125 secondsTime to load utils op: 0.0015048980712890625 seconds + 7: + 7: +23: Time to load utils op: 0.0013675689697265625 seconds +27: Time to load utils op: 0.0014204978942871094 seconds +28: Time to load utils op: 0.0013387203216552734 seconds +17: Time to load utils op: 0.0012454986572265625 seconds +11: Time to load utils op: 0.0014181137084960938 seconds +11: Time to load utils op: 0.00141143798828125 seconds + 7: Time to load utils op: 0.0014133453369140625 seconds +27: Time to load utils op: 0.0014142990112304688 seconds +29: Time to load utils op: 0.0012540817260742188 seconds + 8: Time to load utils op: 0.0013458728790283203 seconds + 8: Time to load utils op: 0.0013346672058105469 seconds +19: Time to load utils op: 0.0014641284942626953 seconds +17: Time to load utils op: 0.0014140605926513672 seconds +17: Time to load utils op: 0.0013327598571777344 seconds +18: Time to load utils op: 0.0016727447509765625 seconds + 4: Time to load utils op: 0.0021741390228271484 seconds +29: Time to load utils op: 0.001322031021118164 seconds +17: Time to load utils op: 0.0013527870178222656 seconds +11: Time to load utils op: 0.0014507770538330078 seconds + 4: Time to load utils op: 0.0024437904357910156 seconds +23: Time to load utils op: 0.0015757083892822266 seconds +29: Time to load utils op: 0.0013833045959472656 seconds +29: Time to load utils op: 0.0013759136199951172 secondsTime to load utils op: 0.0013790130615234375 seconds +29: +20: Time to load utils op: 0.0013058185577392578 seconds +28: Time to load utils op: 0.001424551010131836 seconds +28: Time to load utils op: 0.0014562606811523438 secondsTime to load utils op: 0.0014142990112304688 seconds +28: +15: Time to load utils op: 0.0018911361694335938 seconds + 4: Time to load utils op: 0.002340555191040039 seconds +15: Time to load utils op: 0.0019140243530273438 seconds +20: Time to load utils op: 0.0013108253479003906 seconds +20: Time to load utils op: 0.001268625259399414 seconds +20: Time to load utils op: 0.0013129711151123047 seconds +20: Time to load utils op: 0.0014367103576660156 seconds +25: Time to load utils op: 0.0018413066864013672 seconds + 4: Time to load utils op: 0.0019545555114746094 seconds +20: Time to load utils op: 0.0012793540954589844 seconds + 4: Time to load utils op: 0.001941680908203125 secondsTime to load utils op: 0.0018734931945800781 secondsTime to load utils op: 0.0019457340240478516 seconds + 4: + 4: + 4: Time to load utils op: 0.002195119857788086 seconds +24: Time to load utils op: 0.0024416446685791016 seconds + 6: Time to load utils op: 0.002155780792236328 seconds +21: Time to load utils op: 0.0019936561584472656 seconds +13: Time to load utils op: 0.0021729469299316406 seconds +13: Time to load utils op: 0.0022084712982177734 seconds +13: Time to load utils op: 0.0022230148315429688 seconds +21: Time to load utils op: 0.0020270347595214844 seconds +21: Time to load utils op: 0.0020170211791992188 seconds + 6: Time to load utils op: 0.0022253990173339844 seconds +13: Time to load utils op: 0.0022361278533935547 seconds +21: Time to load utils op: 0.002247333526611328 seconds +21: Time to load utils op: 0.0020737648010253906 seconds +13: Time to load utils op: 0.002246856689453125 seconds +21: Time to load utils op: 0.001974821090698242 seconds +25: Time to load utils op: 0.0024023056030273438 seconds +24: Time to load utils op: 0.0027627944946289062 seconds +25: Time to load utils op: 0.002346038818359375 seconds + 6: Time to load utils op: 0.0024673938751220703 seconds + 6: Time to load utils op: 0.002570629119873047 seconds + 6: Time to load utils op: 0.002530336380004883 secondsTime to load utils op: 0.0025506019592285156 seconds + 6: +25: Time to load utils op: 0.002159595489501953 secondsTime to load utils op: 0.0023636817932128906 seconds +25: +25: Time to load utils op: 0.0023381710052490234 seconds + 6: Time to load utils op: 0.0025081634521484375 seconds +25: Time to load utils op: 0.0023450851440429688 secondsTime to load utils op: 0.0023338794708251953 seconds +25: + 6: Time to load utils op: 0.002498149871826172 seconds +24: Time to load utils op: 0.002675294876098633 seconds +24: Time to load utils op: 0.0028111934661865234 seconds +24: Time to load utils op: 0.0028493404388427734 seconds +24: Time to load utils op: 0.003001689910888672 seconds +24: Time to load utils op: 0.003261089324951172 seconds + 0: [2023-05-10 12:37:33,886] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 + 0: [2023-05-10 12:37:33,887] [INFO] [utils.py:828:see_memory_usage] MA 5.38 GB Max_MA 5.38 GB CA 6.82 GB Max_CA 7 GB + 0: [2023-05-10 12:37:33,887] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.94 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,001] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-05-10 12:37:34,001] [INFO] [utils.py:828:see_memory_usage] MA 5.38 GB Max_MA 5.38 GB CA 6.82 GB Max_CA 7 GB + 0: [2023-05-10 12:37:34,001] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.92 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,111] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-05-10 12:37:34,112] [INFO] [utils.py:828:see_memory_usage] MA 7.9 GB Max_MA 7.9 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:37:34,112] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.93 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,216] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-05-10 12:37:34,216] [INFO] [utils.py:828:see_memory_usage] MA 7.9 GB Max_MA 7.9 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:37:34,216] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.93 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,323] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-05-10 12:37:34,324] [INFO] [utils.py:828:see_memory_usage] MA 7.91 GB Max_MA 7.91 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:37:34,324] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.93 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,425] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer + 0: [2023-05-10 12:37:34,425] [INFO] [utils.py:828:see_memory_usage] MA 7.91 GB Max_MA 7.91 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:37:34,426] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.93 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,534] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-05-10 12:37:34,535] [INFO] [utils.py:828:see_memory_usage] MA 7.99 GB Max_MA 7.99 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:37:34,535] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.93 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,636] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-05-10 12:37:34,637] [INFO] [utils.py:828:see_memory_usage] MA 7.99 GB Max_MA 7.99 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:37:34,637] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.93 GB, percent = 7.9% + 0: [2023-05-10 12:37:34,637] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-05-10 12:37:34,637] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-05-10 12:37:34,637] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-05-10 12:37:34,637] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-05-10 12:37:34,638] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: + 0: [2023-05-10 12:37:34,638] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-05-10 12:37:34,638] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-05-10 12:37:34,638] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-05-10 12:37:34,638] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-05-10 12:37:34,638] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 4 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-05-10 12:37:34,639] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] train_batch_size ............. 1024 + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 2 + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] world_size ................... 128 + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 0: [2023-05-10 12:37:34,640] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 2, + 0: "train_batch_size": 1.024000e+03, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } + 0: Time to load utils op: 0.0003867149353027344 seconds + 0: [2023-05-10 12:37:34,640] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=4 micro_batch_size=2 + 0: [2023-05-10 12:37:34,825] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=1407562240 (1407.562M) TOTAL_PARAMS=2815124480 (2815.124M) UNIQUE_PARAMS=2815124480 (2815.124M) + 0: [2023-05-10 12:37:34,825] [INFO] [engine.py:145:__init__] RANK=1 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=1407562240 (1407.562M) TOTAL_PARAMS=2815124480 (2815.124M) UNIQUE_PARAMS=2815124480 (2815.124M) +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:36,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:37:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:37:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:37:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:37:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:37:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:37:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:37:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:37:37,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:37:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:37:37,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:37:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:37:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:37:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:37:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:37:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:37:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:37:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:37:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:37:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:37:37,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:37:37,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:37:37,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:37:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:37:37,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:37:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:37:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:37:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:37:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:37:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:37:37,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:37:37,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:37:37,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:37:37,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:37:37,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:37:37,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:37:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:37:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:37:37,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 9: [2023-05-10 12:37:37,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 9: [2023-05-10 12:37:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:37:37,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:37:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:37:37,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:37:37,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:37:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:37:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:37:37,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:37:37,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:37:37,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:37:37,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:37:37,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:37,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:37:37,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:37:37,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:37:37,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:37:37,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 1: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:37:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:37:37,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:37:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:37:37,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:37:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:37:37,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:37:37,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:37:37,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:37,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:37:37,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:37:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:37:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:37:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:37:37,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:37,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:37,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:37:37,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:37:37,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:37,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:37,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:37,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:37:37,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:37,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:37:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:37,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:37:37,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:37,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:37,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:37,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:37,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:37:37,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:37:37,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:37,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:37:37,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:37:37,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:37,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:37,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:37:37,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:37:37,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:37,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:37:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:37:37,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:37,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:37:37,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:37,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:37:37,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:37:37,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:37,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:37:37,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:37:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:37,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:37:37,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:37:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:37:37,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:37,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:37,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:37,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:37,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:37,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:37,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:37,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:37,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:37,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:37,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:37:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:37:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:37:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:37:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:37:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:37:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:37:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:37:37,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:37,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:37:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:37:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:37:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:37:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:37:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:37:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:37:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:37:37,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:37:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:37:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:37,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:37:37,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:37:37,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:37:37,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:37:37,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:37:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:37,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:37,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:37,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:37,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:37:37,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:37:37,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:37:37,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:37:37,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:37:37,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:37,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:37,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:37,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:37,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:37,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:37,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:37,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:37,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:37:37,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:37,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:37:37,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:37:37,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:37:37,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:37:37,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:37:37,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:37:37,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:37:37,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:37:37,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:37,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:37,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:37,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:37,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:37,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:37:37,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:37:37,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:37:37,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:37:37,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:37,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:37,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:37:37,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:38,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:38,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:37:38,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:37:38,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:37:38,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:37:38,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:37:38,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:37:38,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:37:38,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:37:38,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:37:38,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:37:38,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:37:38,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:37:38,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:37:38,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:37:38,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:37:38,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:37:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:37:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:37:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:37:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:37:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:37:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:37:38,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:37:38,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:37:38,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:37:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:37:38,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:37:38,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:37:38,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:37:38,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:37:38,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:37:38,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:37:38,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:37:38,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:38,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:38,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:37:38,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:37:38,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:37:38,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:37:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:37:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:37:38,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:37:38,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:37:38,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:37:38,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:37:38,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:37:38,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:37:38,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:37:38,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:37:38,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:37:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:37:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:37:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:37:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:37:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:37:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:37:38,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:37:38,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:38,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:38,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:37:38,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:37:38,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:37:38,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:38,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:38,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:37:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:37:38,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:37:38,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:37:38,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:37:38,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:37:38,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:37:38,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:37:38,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:37:38,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:37:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:37:38,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:37:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:37:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:37:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:37:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:37:38,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:37:38,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:37:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:37:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:37:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:37:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:37:38,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:37:38,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:37:38,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:38,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:37:38,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:37:38,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:37:38,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:37:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:37:38,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:37:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:37:38,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:37:38,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:37:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:37:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:37:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:37:38,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:37:38,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:37:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:37:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:37:38,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:37:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:37:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:37:38,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:37:38,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:37:38,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:37:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:37:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:37:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:37:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:37:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:37:38,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:37:38,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:37:38,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:37:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:37:38,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:37:38,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:37:38,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:37:38,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:37:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:37:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:37:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:37:38,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:37:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:37:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:37:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:37:38,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:37:38,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:37:38,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:37:38,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:37:38,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:37:38,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:37:38,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:37:38,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:37:38,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:37:38,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:37:38,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:37:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:37:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:37:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:37:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:37:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:37:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:37:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:37:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:37:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:37:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:37:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:37:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:37:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:37:38,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:37:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:37:38,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:37:38,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:37:38,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:37:38,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:37:38,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:37:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:37:38,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:37:38,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:37:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:37:38,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:37:38,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:37:38,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:37:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:37:38,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:37:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:37:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:37:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:37:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:37:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:37:38,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:37:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:37:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:37:38,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:37:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:37:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:37:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +11: [2023-05-10 12:37:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:37:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:37:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:37:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:37:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:37:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:37:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:37:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:37:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:37:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:37:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:37:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:37:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:37:38,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:37:38,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:37:38,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:37:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:37:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:37:38,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:37:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:37:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:37:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:37:38,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:37:38,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +11: [2023-05-10 12:37:38,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:37:38,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:37:38,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:37:38,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:37:38,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:37:38,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:37:38,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:37:38,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:37:38,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:37:38,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:37:38,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:37:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:37:38,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:37:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:37:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:37:38,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:37:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:37:38,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:37:38,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:37:38,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:37:38,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:37:38,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:37:38,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:37:38,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:37:38,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:37:38,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:37:38,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:37:38,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:37:38,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:37:38,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:37:38,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:37:38,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:37:38,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +19: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +19: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:37:38,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:37:38,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:37:38,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:37:38,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:37:38,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:37:38,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:37:38,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:37:38,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:37:38,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:37:38,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:37:38,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:37:38,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:37:38,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:37:38,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:37:38,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:37:38,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:37:38,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:37:38,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:37:38,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:37:38,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:37:38,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:37:38,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:37:38,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:37:38,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:37:38,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:37:38,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:37:38,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:37:38,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:37:38,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:37:38,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:37:38,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:37:38,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:37:38,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:37:38,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:37:38,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:37:38,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:37:38,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:37:38,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:37:38,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +15: [2023-05-10 12:37:38,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:37:38,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:37:38,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:37:38,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:37:38,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:37:38,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:37:38,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:37:38,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:38,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:37:38,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:37:38,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:37:38,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:37:38,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:37:38,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:37:38,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:37:38,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:37:38,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:37:38,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:37:38,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:37:38,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:37:38,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:37:38,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:37:38,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:37:38,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:37:38,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:37:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:38,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:37:38,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:37:38,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:38,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:37:38,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:38,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:37:38,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:38,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:37:38,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:37:38,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:37:38,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:38,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:38,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:37:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:37:38,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:37:38,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:37:38,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:37:38,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:37:38,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:37:38,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:37:38,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:37:38,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:37:38,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:37:38,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:38,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:37:38,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:37:38,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:37:38,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:38,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:38,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:38,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:37:38,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:37:38,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:38,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:37:38,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:37:38,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:37:38,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:37:38,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:37:38,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:37:38,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:38,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:38,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:38,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:38,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:37:38,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:38,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:38,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:37:38,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:37:38,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:37:38,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:37:38,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:37:38,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:38,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:37:38,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:37:38,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:38,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:37:38,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:38,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:38,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:38,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:37:38,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:38,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:37:38,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:38,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:38,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:38,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:38,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:37:38,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:38,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:38,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:38,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:38,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:38,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:37:38,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:38,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:37:38,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:37:38,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:37:38,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:38,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:38,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:37:38,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:37:38,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +19: [2023-05-10 12:37:38,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:37:38,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:38,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:38,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:37:38,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:38,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:38,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:37:38,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:37:38,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:37:38,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:37:38,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:38,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 8: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 5: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:37:38,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:37:38,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:38,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:37:38,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:37:38,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:37:38,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:38,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:38,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:38,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:38,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:37:38,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:38,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:37:38,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:37:38,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:38,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:37:38,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:37:38,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:38,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:38,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:38,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:37:38,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:37:38,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:37:38,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:38,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:37:38,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:38,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:38,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:38,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:37:38,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:37:38,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:37:38,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:37:38,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:37:38,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:37:38,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:38,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:37:38,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:37:38,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:38,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:37:38,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:38,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:38,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:37:38,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:38,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:38,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:38,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:38,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:38,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:38,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:38,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:38,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:37:38,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:37:38,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:37:38,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:37:38,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:37:38,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:38,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:38,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:38,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:38,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:38,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:38,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:37:38,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:38,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:38,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:38,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:37:38,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:38,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:38,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:38,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:38,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:38,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:38,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:38,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:38,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:38,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:38,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:38,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:38,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:38,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:38,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:38,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:39,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:39,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:39,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:39,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:37:39,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:37:39,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:39,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +14: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:37:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:37:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:37:39,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:37:39,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:39,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:39,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:37:39,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:39,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:39,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:39,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:37:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:37:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:37:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:37:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:39,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:37:39,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:37:39,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:37:39,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:37:39,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:37:39,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:37:39,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:39,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:39,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:39,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:37:39,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:37:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:39,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:39,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:39,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:39,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:37:39,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:37:39,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:37:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:37:39,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:39,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:37:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:37:39,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:37:39,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:39,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:37:39,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:39,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:39,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:37:39,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:37:39,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:37:39,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:37:39,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:37:39,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:37:39,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:37:39,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:37:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:37:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +14: [2023-05-10 12:37:39,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:37:39,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:39,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:39,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:37:39,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:37:39,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:39,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:39,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:37:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:37:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:39,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:39,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:37:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:37:39,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:37:39,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:37:39,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:37:39,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:39,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:37:39,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:37:39,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:39,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:39,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:39,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:37:39,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:39,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:39,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:39,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:39,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:39,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:37:39,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:39,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:37:39,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:37:39,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:39,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:37:39,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:37:39,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:37:39,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:39,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:37:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:37:39,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:37:39,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:37:39,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:37:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:37:39,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:37:39,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:37:39,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:39,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:37:39,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:37:39,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:39,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:37:39,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:37:39,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:37:39,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:37:39,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:37:39,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:37:39,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:39,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:39,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:37:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:37:39,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +22: [2023-05-10 12:37:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:37:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:37:39,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:37:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:37:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:37:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:37:39,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:37:39,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:37:39,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:37:39,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:37:39,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:37:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:37:39,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:37:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:37:39,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:37:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:37:39,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:37:39,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:37:39,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:37:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:37:39,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:37:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:37:39,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:37:39,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:37:39,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:37:39,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:37:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:37:39,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:37:39,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:37:39,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:37:39,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:37:39,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:37:39,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:37:39,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:37:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:37:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:37:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:37:39,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:37:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:37:39,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:37:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:37:39,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:37:39,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:37:39,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:37:39,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:37:39,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:37:39,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:37:39,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:37:39,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:37:39,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:37:39,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:37:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:37:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:37:39,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:37:39,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:37:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:37:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:37:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:37:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:37:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:37:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:37:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:37:39,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:37:39,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:37:39,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:37:39,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:37:39,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:37:39,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:37:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:37:39,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:37:39,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:37:39,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:37:39,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:37:39,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:37:39,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:37:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:37:39,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:37:39,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:37:39,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:37:39,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:37:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:37:39,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:37:39,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:37:39,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:37:39,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:37:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:37:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:37:39,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:37:39,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:37:39,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:37:39,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:37:39,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:37:39,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:37:39,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:37:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:37:39,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:37:39,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:37:39,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:37:39,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:37:39,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:37:39,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:37:39,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:37:39,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:37:39,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:37:39,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:37:39,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:37:39,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:37:39,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:37:39,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:37:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:37:39,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:37:39,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:37:39,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:37:39,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:37:39,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:37:39,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:37:39,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:37:39,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:37:39,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:37:39,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:37:39,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:37:39,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:37:39,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:37:39,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:37:39,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:37:39,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:37:39,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:37:39,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:37:39,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:37:39,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:37:39,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:37:39,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:37:39,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:37:39,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:37:39,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:37:39,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:37:39,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:37:39,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:37:39,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:37:39,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:37:39,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:37:39,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:37:39,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:37:39,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:37:39,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:37:39,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:37:39,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:37:39,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:37:39,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:37:39,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:37:39,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:37:39,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:37:39,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:37:39,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:37:39,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:37:39,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:37:39,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:37:39,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:37:39,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:37:39,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:37:39,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:37:39,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:37:39,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:37:39,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:37:39,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:37:39,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:37:39,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:37:39,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:37:39,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:37:39,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:37:39,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:37:39,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:37:39,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:37:39,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:37:39,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:37:39,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:37:39,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:37:39,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:37:39,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:37:39,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:37:39,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:37:39,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:37:39,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:37:39,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:37:39,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:37:39,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:37:39,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:37:39,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:37:39,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:37:39,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:37:39,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:37:39,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:37:39,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:37:39,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:37:39,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:37:39,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:37:39,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:37:39,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:37:39,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:37:39,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:37:39,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:39,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:37:39,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:37:39,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:37:39,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:37:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:37:39,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:37:39,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:37:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:37:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:37:39,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:37:39,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:37:39,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:37:39,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:37:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:37:39,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:37:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:37:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:37:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:37:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:37:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:37:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:37:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:37:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:37:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:37:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:37:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:37:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:37:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:37:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:37:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:37:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:37:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:37:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:37:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:37:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:37:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:37:39,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:37:39,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:37:39,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:37:39,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:37:39,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:37:39,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +19: [2023-05-10 12:37:39,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:37:39,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:37:39,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:37:39,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:37:39,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:37:39,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:39,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:37:39,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:37:39,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:37:39,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:37:39,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:37:39,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:39,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:37:39,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:37:39,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:39,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:37:39,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:37:39,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:37:39,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:37:39,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:37:39,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:37:39,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:39,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:37:39,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:37:39,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:37:39,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:37:39,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:37:39,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:37:39,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:37:39,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:39,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:37:39,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:37:39,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:39,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:37:39,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:37:39,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:37:39,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:37:39,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:39,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:37:39,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:37:39,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:37:39,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:39,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:39,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:37:39,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:37:39,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:37:39,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:39,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:39,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:39,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:39,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:37:39,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:37:39,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:37:39,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:37:39,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:37:39,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:37:39,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:37:39,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:37:39,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:37:39,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:37:39,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:37:39,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:37:39,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:37:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:37:39,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:39,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:37:39,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:37:39,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:39,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:39,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:37:39,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:37:39,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:37:39,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:37:39,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:37:39,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:37:39,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:37:39,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:39,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:37:39,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:39,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:37:39,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:37:39,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:37:39,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:39,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:37:39,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:39,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:37:39,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:39,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:37:39,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:39,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:39,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:39,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:37:39,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:39,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:37:39,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:39,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:39,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:39,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:37:39,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:37:39,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:37:39,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:39,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:37:39,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:39,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:39,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:37:39,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:37:39,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:37:39,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:37:39,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:37:39,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:37:39,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:37:39,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:37:39,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:37:39,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:37:39,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:37:39,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:37:39,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:37:39,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:37:39,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:37:39,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:37:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:37:39,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:37:39,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:37:39,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:37:39,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:39,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:39,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:37:39,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:39,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:37:39,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:39,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:37:39,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:37:39,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +14: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:37:39,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:37:39,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:37:39,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:37:39,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:37:39,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:37:39,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:37:39,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:39,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:39,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:37:39,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:39,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:37:39,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +13: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:37:39,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:37:39,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:37:39,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:37:39,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:37:39,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:39,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:39,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:39,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:37:39,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:37:39,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:37:39,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:37:39,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:37:39,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:37:39,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:37:39,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:37:39,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:37:39,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:37:39,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:39,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:37:39,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:37:39,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:37:39,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:37:39,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:37:39,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:37:39,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:37:39,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:39,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:39,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:39,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:39,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:37:39,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:39,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:37:39,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:37:39,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:37:39,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:37:39,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:37:39,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:37:39,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:37:39,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:37:39,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:37:39,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:37:39,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:37:39,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:37:39,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:39,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:37:39,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:37:39,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:39,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:37:39,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:39,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:37:39,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:37:39,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:39,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:39,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:39,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:39,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:37:39,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:37:39,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:37:39,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:37:39,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:37:39,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:39,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:39,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:40,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:40,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:37:40,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:40,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:37:40,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:37:40,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:37:40,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:37:40,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:37:40,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:37:40,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:37:40,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:37:40,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:37:40,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:37:40,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:37:40,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:37:40,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:37:40,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:37:40,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:37:40,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:37:40,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:37:40,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:37:40,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:37:40,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:37:40,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:40,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:40,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:37:40,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:37:40,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:37:40,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:37:40,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +26: [2023-05-10 12:37:40,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:37:40,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:37:40,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:37:40,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:37:40,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:37:40,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:40,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:37:40,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:37:40,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:37:40,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:37:40,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:37:40,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:37:40,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:37:40,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:37:40,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:37:40,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:37:40,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:37:40,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:37:40,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:37:40,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:37:40,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:37:40,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:40,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:37:40,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:40,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:37:40,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:37:40,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:37:40,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:37:40,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:37:40,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:40,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:37:40,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:37:40,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:37:40,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:37:40,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:37:40,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:37:40,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:37:40,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:37:40,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:37:40,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +14: [2023-05-10 12:37:40,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:37:40,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:37:40,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:37:40,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:37:40,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:40,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:40,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:37:40,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:37:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:37:40,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:37:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:37:40,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:37:40,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:37:40,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:37:40,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:37:40,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:37:40,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:37:40,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:37:40,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:37:40,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:37:40,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:37:40,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:37:40,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:37:40,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:37:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:37:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:37:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:37:40,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:37:40,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:37:40,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:37:40,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:37:40,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:37:40,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:37:40,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:37:40,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:37:40,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:37:40,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:37:40,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +14: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +14: [2023-05-10 12:37:40,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:37:40,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:37:40,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:37:40,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:37:40,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:37:40,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:37:40,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:37:40,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:37:40,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:37:40,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:37:40,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:37:40,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:37:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:37:40,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:37:40,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:37:40,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:37:40,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:37:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:37:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:37:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:37:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:37:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:37:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:37:40,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:37:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:37:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:37:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:37:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:37:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:37:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:37:40,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:37:40,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:37:40,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:37:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:37:40,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:37:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:37:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:37:40,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:37:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:37:40,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:37:40,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:37:40,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:37:40,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:37:40,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:37:40,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:37:40,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:37:40,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:37:40,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:37:40,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:37:40,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:37:40,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:37:40,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:37:40,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:37:40,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:37:40,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:37:40,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:37:40,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:37:40,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:37:40,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:37:40,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:37:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:37:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:37:40,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:37:40,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:37:40,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:37:40,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:37:40,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:37:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:37:40,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:37:40,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:37:40,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:37:40,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:37:40,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:37:40,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:37:40,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:37:40,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:37:40,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:37:40,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:37:40,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:37:40,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:37:40,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:37:40,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:37:40,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:37:40,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:37:40,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:37:40,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:37:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:37:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:37:40,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:37:40,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:37:40,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:37:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:37:40,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:37:40,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:37:40,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:37:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:37:40,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:37:40,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:37:40,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:37:40,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:37:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:37:40,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:37:40,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:37:40,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:37:40,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:37:40,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:37:40,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:37:40,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:37:40,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:37:40,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:37:40,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:37:40,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:37:40,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:37:40,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:37:40,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:37:40,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:37:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:37:40,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:37:40,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:37:40,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:37:40,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:37:40,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:37:40,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:37:40,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:37:40,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:37:40,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:37:40,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:37:40,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:37:40,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:37:40,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:37:40,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:37:40,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:37:40,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:37:40,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:37:40,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:37:40,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:37:40,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:37:40,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 6: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:37:40,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:40,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 4: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:37:40,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +10: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:37:40,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:37:40,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:37:40,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +13: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:37:40,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:37:40,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:37:40,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:37:40,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:37:40,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:37:40,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:37:40,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:37:40,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:37:40,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:37:40,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:37:40,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +13: [2023-05-10 12:37:40,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:37:40,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:37:40,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:37:40,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:37:40,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:37:40,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:37:40,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:37:40,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:37:40,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:37:40,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:37:40,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:37:40,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:37:40,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:37:40,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:37:40,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:37:40,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:37:40,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:37:40,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:37:40,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:37:40,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:37:40,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:37:40,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:40,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:40,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:37:40,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:37:40,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:40,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:37:40,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:37:40,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:37:40,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:40,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:40,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:40,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:40,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:40,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:37:40,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:37:40,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:40,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:40,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:37:40,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:40,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:40,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:40,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:40,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:37:40,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:37:40,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:40,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:40,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:40,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:40,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:40,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:40,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:40,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:40,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:40,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:40,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:40,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:40,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:40,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:40,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:40,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:40,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:40,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:40,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:40,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:40,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:40,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:40,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:40,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:40,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:40,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:40,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:40,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:40,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:40,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:40,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:40,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:40,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:40,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:40,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:40,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:40,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:40,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:37:40,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:40,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:40,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:37:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:37:40,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:40,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:40,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:40,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:40,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:40,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:37:40,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:40,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:40,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:40,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:40,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:40,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:40,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:40,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:40,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:40,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:40,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:37:40,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:40,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:40,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:40,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:40,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:40,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:40,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:40,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:40,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:40,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:40,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:40,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:40,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:37:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:37:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:40,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:40,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:40,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:40,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:37:40,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:40,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:40,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:40,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:40,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:40,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:40,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:40,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:40,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:40,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:40,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:40,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:40,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:40,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:40,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:40,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:40,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:40,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:40,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:40,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:40,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:40,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:40,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:40,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:40,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:40,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:40,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:40,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:40,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:40,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:40,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:40,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:40,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:41,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:37:41,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:37:41,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:37:41,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:37:41,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:37:41,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:37:41,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:37:41,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:41,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:41,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:41,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:37:41,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:37:41,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:37:41,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:37:41,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:37:41,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:37:41,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:37:41,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:37:41,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:37:41,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:37:41,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:37:41,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:41,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:37:41,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:41,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:41,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:41,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:41,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:37:41,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:37:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:37:41,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:37:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:37:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:37:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:37:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:37:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:37:41,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:41,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:41,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:41,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:41,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:37:41,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:37:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:37:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:41,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:41,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:37:41,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:37:41,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:37:41,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:37:41,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:41,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:37:41,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:37:41,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:37:41,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:37:41,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:41,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:37:41,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:37:41,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:37:41,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:37:41,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:37:41,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:37:41,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:37:41,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:37:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:37:41,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:37:41,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:41,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:37:41,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:37:41,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:37:41,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:41,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:41,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:41,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:41,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:41,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:37:41,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:37:41,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:37:41,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:41,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:41,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:37:41,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:41,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:37:41,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:37:41,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:37:41,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:41,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:41,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:37:41,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:37:41,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:41,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:37:41,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:37:41,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:37:41,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:37:41,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:37:41,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:37:41,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:37:41,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:41,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:37:41,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:41,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:41,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:37:41,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:37:41,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:37:41,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:37:41,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:37:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:37:41,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:37:41,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:37:41,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:37:41,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:41,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:37:41,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:37:41,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:37:41,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:37:41,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:37:41,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:37:41,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:37:41,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:37:41,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:37:41,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:37:41,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:41,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:41,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:41,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:41,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:37:41,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:41,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:37:41,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:41,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:41,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:41,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:37:41,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:41,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:41,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:41,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:37:41,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:37:41,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:37:41,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:37:41,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:41,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:41,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:41,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:37:41,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:37:41,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:37:41,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:37:41,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:41,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:37:41,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:37:41,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:37:41,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:37:41,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:37:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:37:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:37:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:37:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:37:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:37:41,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:37:41,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:37:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:37:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:37:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:37:41,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:37:41,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:37:41,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:41,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:41,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:37:41,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:37:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:41,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:41,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:41,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:41,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:37:41,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:37:41,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:37:41,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:41,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:41,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:37:41,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:37:41,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:37:41,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:41,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:41,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:41,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:37:41,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:37:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:37:41,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:37:41,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:37:41,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:37:41,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:41,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:41,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:37:41,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:37:41,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:37:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:37:41,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:37:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:37:41,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:41,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:37:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:37:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:37:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:41,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:37:41,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:37:41,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:41,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:37:41,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:37:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:37:41,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:37:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:37:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:37:41,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:41,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:37:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:37:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:37:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:37:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:37:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:37:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:37:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:37:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:37:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:37:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:37:41,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:37:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:37:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:37:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:37:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:37:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:41,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:37:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:37:41,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:37:41,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:37:41,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:37:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:41,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:37:41,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:37:41,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:41,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:41,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:41,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:37:41,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:37:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:37:41,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:41,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:37:41,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:41,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:37:41,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:41,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:37:41,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:41,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:41,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:41,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:41,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:37:41,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:41,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:41,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:41,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:41,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:41,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:41,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:37:41,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:41,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:41,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:41,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:41,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:37:41,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:41,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:41,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:41,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:41,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:37:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:37:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:37:41,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:41,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:37:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +14: [2023-05-10 12:37:41,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:37:41,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:37:41,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +14: [2023-05-10 12:37:41,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:37:41,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:41,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:41,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:41,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:37:41,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:37:41,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:37:41,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:37:41,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:41,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:37:41,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:37:41,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:41,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:41,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:41,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:37:41,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:37:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 5: [2023-05-10 12:37:41,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:37:41,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:37:41,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:37:41,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:41,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:37:41,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:37:41,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:41,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:41,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:37:41,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:37:41,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:37:41,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:37:41,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:41,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:41,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:37:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:37:41,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:37:41,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:37:41,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:37:41,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:37:41,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:37:41,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:37:41,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:37:41,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:41,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:37:41,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:37:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:37:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:37:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:37:41,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:41,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:41,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:37:41,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:41,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:37:41,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:37:41,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:37:41,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:37:41,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:37:41,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:37:41,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:37:41,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:41,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:41,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:37:41,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:37:41,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:41,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:41,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:41,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:41,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:37:41,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:37:41,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:37:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:37:41,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:37:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:37:41,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:37:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:37:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:37:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:37:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:37:41,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:37:41,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:37:41,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:37:41,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 6: [2023-05-10 12:37:41,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:41,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:41,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:41,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:37:41,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:41,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:37:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:37:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:37:41,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:37:41,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:37:41,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:37:41,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:37:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:37:41,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:41,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:41,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:37:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:37:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:41,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:37:41,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:37:41,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:37:41,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:37:41,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:37:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:37:41,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:37:41,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:37:41,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:37:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:37:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:37:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:37:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:37:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:37:41,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:37:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:37:41,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:37:41,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:41,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:37:41,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:37:41,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:37:41,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:37:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:41,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:41,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:37:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:37:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:37:41,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:37:41,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:41,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:37:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:37:41,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:37:41,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:41,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:41,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:41,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:37:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:41,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:41,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:41,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:41,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:41,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:41,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:41,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:37:41,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:37:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:37:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:37:41,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:37:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:37:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:37:41,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:41,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:37:41,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:41,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:41,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:37:41,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:41,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:37:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:37:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:41,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:41,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:41,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +14: [2023-05-10 12:37:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:37:41,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:41,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:37:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:37:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:41,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:41,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:41,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:41,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:37:41,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:37:41,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:37:41,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:37:41,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:37:41,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:37:41,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:37:41,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:37:41,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:37:41,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:41,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:41,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:41,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:41,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:41,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:41,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:37:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:41,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:41,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:41,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:37:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:37:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:37:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:37:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:41,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:37:41,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:37:41,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:37:41,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:37:41,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +14: [2023-05-10 12:37:41,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:41,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:37:41,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:37:41,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:37:41,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:41,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:41,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:41,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:41,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:41,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:37:41,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:37:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:37:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:37:41,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:37:41,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:41,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:37:41,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:37:41,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:41,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:37:41,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:37:41,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:37:41,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:41,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:41,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:41,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:41,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:41,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:41,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:41,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:41,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:37:41,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:41,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:37:42,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:37:42,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:37:42,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:37:42,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:42,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:42,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:42,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:42,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:42,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:37:42,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:42,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:42,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:37:42,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:37:42,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:37:42,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:37:42,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:42,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:42,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:37:42,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:37:42,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:42,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:37:42,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:42,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:42,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:37:42,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:37:42,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:42,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:37:42,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:42,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:37:42,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:42,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:37:42,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:37:42,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:37:42,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:42,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:42,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:37:42,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:37:42,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:37:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:37:42,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:42,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:37:42,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:37:42,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:42,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:42,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:37:42,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:37:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:42,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:42,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:42,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:37:42,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:37:42,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:37:42,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:37:42,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:37:42,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:37:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:37:42,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:37:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:42,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:42,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:37:42,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:42,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:37:42,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:37:42,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:37:42,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:42,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:37:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:42,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:37:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:42,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:37:42,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:37:42,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:42,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:37:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:37:42,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:37:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:37:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:37:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +24: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:37:42,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:37:42,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:42,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:42,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:37:42,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:37:42,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:37:42,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:37:42,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:37:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:42,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:37:42,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:42,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:37:42,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:37:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:42,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +24: [2023-05-10 12:37:42,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:37:42,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:42,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:37:42,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:42,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:42,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:37:42,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:42,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:37:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:37:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:37:42,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:37:42,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +11: [2023-05-10 12:37:42,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:37:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:42,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:37:42,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:37:42,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:37:42,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:42,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:37:42,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:37:42,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +11: [2023-05-10 12:37:42,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:37:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:37:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:37:42,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:37:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:37:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:37:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:37:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:37:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:37:42,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 2: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:37:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:37:42,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:37:42,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:42,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:37:42,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:37:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:37:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:37:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:37:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:37:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:37:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:37:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +12: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:37:42,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:37:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:37:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:37:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:42,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +12: [2023-05-10 12:37:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +12: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:37:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:37:42,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:37:42,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:37:42,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:37:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:37:42,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:37:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:37:42,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:37:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:37:42,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:37:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:37:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:37:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:37:42,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:37:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:37:42,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:37:42,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:37:42,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:37:42,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:37:42,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:37:42,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:37:42,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:37:42,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +22: [2023-05-10 12:37:42,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:37:42,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:37:42,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:37:42,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:37:42,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:42,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:37:42,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:37:42,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:37:42,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:37:42,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:37:42,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:42,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:37:42,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:37:42,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:37:42,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:37:42,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:37:42,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:37:42,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:37:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:37:42,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:37:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:37:42,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:37:42,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:37:42,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:42,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:37:42,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:37:42,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:37:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:42,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:37:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:37:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:42,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:37:42,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:37:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:37:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:37:42,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:37:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:42,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:37:42,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:37:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:37:42,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:37:42,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:42,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:37:42,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:42,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:37:42,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:37:42,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:37:42,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:37:42,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:37:42,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:37:42,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:37:42,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:37:42,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:37:42,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:37:42,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:37:42,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:37:42,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:37:42,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:37:42,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:37:42,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:42,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:37:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:37:42,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:37:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:42,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:42,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:42,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:37:42,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:42,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:42,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:42,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:37:42,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:37:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:37:42,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:37:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:42,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:37:42,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:37:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:42,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:37:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:37:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:37:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:37:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:37:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:42,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:37:42,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:37:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:37:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:42,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:37:42,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:37:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:37:42,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:37:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:37:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:42,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:37:42,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:37:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:37:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:37:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:42,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:37:42,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:42,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:37:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:37:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +24: [2023-05-10 12:37:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +24: [2023-05-10 12:37:42,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:37:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:37:42,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:37:42,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:37:42,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:37:42,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:37:42,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +15: [2023-05-10 12:37:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:37:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:37:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:37:42,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:37:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:37:42,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:37:42,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:37:42,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:42,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:37:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:37:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:37:42,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:37:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:37:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:37:42,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:37:42,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:42,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:37:42,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:37:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:37:42,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:37:42,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:37:42,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:37:42,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:37:42,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:37:42,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:37:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:37:42,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:37:42,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:37:42,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:42,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:42,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:37:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:37:42,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:37:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:37:42,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +30: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:37:42,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:42,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:37:42,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:37:42,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:42,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:37:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:42,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:42,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:37:42,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:42,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:37:42,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:42,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:37:42,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:42,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:42,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:42,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:37:42,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:37:42,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:37:42,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:37:42,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:37:42,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:37:42,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:37:42,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:37:42,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:37:42,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:37:42,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:37:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:37:42,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:37:42,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:37:42,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:37:42,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:37:42,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +19: [2023-05-10 12:37:42,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:37:42,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:37:42,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:37:42,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:37:42,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:37:42,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:37:42,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:37:42,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:37:42,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:37:42,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:37:42,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:42,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:37:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:37:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:37:42,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:37:42,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:37:42,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:37:42,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:37:42,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:37:42,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:42,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:42,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:42,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:37:42,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:42,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:42,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:37:42,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:37:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:37:42,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:37:42,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:37:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:37:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +15: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:37:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:37:42,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:37:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:42,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:37:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:37:42,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:42,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:42,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:37:42,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:37:42,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:37:42,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:37:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:42,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:37:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:37:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:42,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:37:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:37:42,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:42,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:37:42,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:37:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:37:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:37:42,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:37:42,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:37:42,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:37:42,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:37:42,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:37:42,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:37:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:37:42,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:37:42,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:37:42,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:37:42,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:42,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:37:42,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:37:42,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:37:42,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:37:42,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:37:42,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:37:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:37:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:37:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:37:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:37:42,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:37:42,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:37:42,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:37:42,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:42,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:37:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:37:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:42,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:37:42,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:42,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:42,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:42,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:37:42,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:37:42,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:37:42,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:37:42,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:37:42,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:42,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:37:42,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:37:42,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:42,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:42,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:42,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:42,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:37:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:37:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:37:42,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:37:42,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:37:42,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:42,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:42,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:37:42,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:37:42,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:37:42,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:37:42,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:37:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:37:42,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:37:42,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:37:42,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:37:42,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:42,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:37:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:42,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:42,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:37:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:37:42,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:37:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:42,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:42,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:42,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:42,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:42,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:37:42,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:37:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:37:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:37:42,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:42,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:37:42,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:42,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:37:42,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:37:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:42,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:42,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:37:42,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:37:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:37:42,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:42,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:42,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:37:42,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:42,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:42,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:42,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:42,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:37:42,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:42,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:42,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:37:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:37:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:37:42,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:42,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:42,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:37:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:37:42,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:37:42,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:37:42,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:42,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:42,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:37:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:37:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:37:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:37:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +16: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:42,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:37:42,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:37:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:37:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:37:42,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:37:42,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:37:42,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:37:42,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:42,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:42,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:37:42,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:42,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:37:42,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:37:42,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:37:42,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:42,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:37:42,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:37:42,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:37:42,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:37:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:42,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:37:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:42,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:42,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +22: [2023-05-10 12:37:42,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:42,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:37:42,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:42,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:37:42,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:42,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:42,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:42,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:42,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:42,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:37:42,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:37:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:37:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:37:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:37:42,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:37:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:42,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:42,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:37:42,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:37:42,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:37:42,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:42,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:42,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:37:42,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:42,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:37:42,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:37:42,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:37:42,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:42,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:42,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:37:42,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:42,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:37:42,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:42,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:42,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:37:42,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:37:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:37:42,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:37:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:37:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:42,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:37:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:37:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:37:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:37:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:37:42,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:42,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:37:42,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:37:42,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:37:42,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:42,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:37:42,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:37:42,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:37:42,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:37:42,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:42,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:37:42,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:37:42,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:42,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:42,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:37:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:37:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:42,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 9: [2023-05-10 12:37:42,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:37:42,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:42,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:42,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:37:43,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:37:43,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:43,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:43,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:43,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:37:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:37:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:37:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:37:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:37:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:37:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:37:43,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:37:43,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:37:43,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:37:43,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:37:43,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:37:43,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:37:43,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +17: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:37:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:43,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:37:43,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:37:43,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:43,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:43,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:37:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:37:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:43,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:43,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:37:43,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:37:43,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:37:43,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:37:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:43,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +20: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +30: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:37:43,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:37:43,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:37:43,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:37:43,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:37:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:37:43,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:37:43,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:37:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:37:43,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:37:43,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:37:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:43,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:37:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:37:43,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:37:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:37:43,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:37:43,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:37:43,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:37:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:37:43,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:37:43,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:43,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:43,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:37:43,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:37:43,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:37:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:37:43,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:43,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:37:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:37:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:37:43,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:37:43,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:43,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:37:43,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:43,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:43,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:43,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:43,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:43,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:37:43,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:43,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:43,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:37:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:37:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:37:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:37:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:37:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:43,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:37:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:37:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +25: [2023-05-10 12:37:43,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:37:43,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:43,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:37:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:37:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:37:43,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:43,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:37:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:43,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:37:43,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:37:43,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:37:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:37:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:37:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:37:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:37:43,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:37:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:37:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:37:43,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:37:43,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:37:43,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:43,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:37:43,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:37:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:43,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:37:43,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:37:43,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:37:43,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:37:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:37:43,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:43,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:37:43,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:37:43,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:43,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:37:43,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:37:43,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:37:43,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:37:43,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:37:43,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:43,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:43,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:37:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:37:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:37:43,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:37:43,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +25: [2023-05-10 12:37:43,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:43,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:43,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:37:43,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:37:43,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +15: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +15: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +15: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:37:43,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:37:43,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:37:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:37:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:43,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:37:43,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:37:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:37:43,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:43,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:37:43,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:37:43,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:37:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:37:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:37:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:37:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:37:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:37:43,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:37:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:37:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:37:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:37:43,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:43,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:37:43,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:37:43,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:37:43,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:37:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:37:43,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:37:43,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:37:43,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:37:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:37:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:37:43,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:37:43,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:37:43,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:37:43,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:37:43,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:37:43,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:37:43,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:37:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:37:43,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:37:43,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:37:43,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:43,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:37:43,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:37:43,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:37:43,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:37:43,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:43,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:37:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:37:43,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:37:43,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:37:43,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:37:43,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:43,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:37:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:37:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:37:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:37:43,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:37:43,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:37:43,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:37:43,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:37:43,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:37:43,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:37:43,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:37:43,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:37:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:37:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:37:43,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +12: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:37:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:37:43,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:43,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:37:43,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:37:43,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:37:43,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:37:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:37:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:37:43,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +12: [2023-05-10 12:37:43,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:37:43,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:37:43,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +22: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:37:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:37:43,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:37:43,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:37:43,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:37:43,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:37:43,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:37:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:37:43,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:37:43,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:37:43,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:37:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:37:43,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:37:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:37:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:37:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:37:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:37:43,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:37:43,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:37:43,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:37:43,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:37:43,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:37:43,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:37:43,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:37:43,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:37:43,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:37:43,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:37:43,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:37:43,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:37:43,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:37:43,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:37:43,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:37:43,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:37:43,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:37:43,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:37:43,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:37:43,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:37:43,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:37:43,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:37:43,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:37:43,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:37:43,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:37:43,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:37:43,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:37:43,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:37:43,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:37:43,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:37:43,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +11: [2023-05-10 12:37:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:37:43,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:37:43,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:37:43,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:37:43,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:37:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:37:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:37:43,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:37:43,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:37:43,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:37:43,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:37:43,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:37:43,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:37:43,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:37:43,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:37:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:37:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:37:43,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:37:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:37:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:37:43,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:37:43,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:37:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:37:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:37:43,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:43,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:43,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:37:43,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:37:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:37:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:37:43,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:37:43,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:37:43,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:37:43,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:37:43,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:37:43,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:37:43,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:37:43,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:37:43,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:37:43,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:37:43,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:37:43,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:37:43,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:37:43,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:37:43,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:37:43,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:37:43,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:37:43,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:37:43,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:37:43,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:37:43,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:37:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:37:43,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:37:43,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:37:43,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:37:43,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:37:43,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:37:43,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:37:43,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:37:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:37:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:37:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:37:43,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:37:43,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:37:43,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:37:43,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:37:43,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:37:43,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:37:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:37:43,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:37:43,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:37:43,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:37:43,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:37:43,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:37:43,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:37:43,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:37:43,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:37:43,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:37:43,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:37:43,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:37:43,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:37:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:37:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:37:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:37:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:37:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:37:43,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:37:43,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:37:43,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:37:43,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:37:43,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:37:43,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:37:43,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:37:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:37:43,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:37:43,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:37:43,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:37:43,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:37:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:37:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:37:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:37:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:37:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:37:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:37:43,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +22: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +22: [2023-05-10 12:37:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:37:43,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:37:43,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:37:43,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:37:43,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:37:43,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:37:43,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:37:43,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:37:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:37:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:37:43,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:37:43,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:37:43,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:37:43,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:37:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:37:43,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:37:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:37:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:37:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:37:43,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:37:43,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:37:43,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:37:43,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:37:43,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:37:43,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:37:43,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:37:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:37:43,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:37:43,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:37:43,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:37:43,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:37:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:37:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:37:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:37:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +24: [2023-05-10 12:37:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:37:43,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:37:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:37:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:37:43,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:37:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:37:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:37:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:37:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:37:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:37:43,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:43,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:37:43,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:37:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:37:43,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:43,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:43,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:37:43,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:43,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:37:43,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:37:43,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:37:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:43,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:37:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:43,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:37:43,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:37:43,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:43,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:43,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:43,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:37:43,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:37:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:43,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:43,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:37:43,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:43,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:43,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:37:43,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:43,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:37:43,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:37:43,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:37:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:37:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:37:43,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:37:43,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:37:43,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:43,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:43,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:43,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:37:43,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:37:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:37:43,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:43,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:43,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:37:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:37:43,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:37:43,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:37:43,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:37:43,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:37:43,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:37:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:37:43,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:37:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:37:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:37:43,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:37:43,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:37:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:43,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:37:43,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:37:43,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:37:43,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:37:43,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:37:43,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:43,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:43,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:37:43,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:37:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:37:43,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:37:43,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:43,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:43,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:37:43,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:37:43,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:37:43,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:37:43,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:37:43,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:37:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:37:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:37:43,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:37:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:37:43,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:37:43,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:37:43,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:37:43,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:37:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:37:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:37:43,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:37:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:37:43,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:37:43,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:37:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:37:43,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:37:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:37:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:37:43,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:37:43,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:37:43,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:37:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:37:43,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +15: [2023-05-10 12:37:43,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:37:43,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:37:43,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:37:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:37:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:43,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:43,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:43,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:37:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:37:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:37:43,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:43,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:37:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:37:43,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:37:43,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:37:43,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:37:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:37:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:43,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:43,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:43,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:37:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:37:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:37:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:43,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:43,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:43,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:37:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:37:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:37:43,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:37:43,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:43,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:37:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:37:43,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:37:43,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +18: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:37:43,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:37:43,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:43,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:43,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:37:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:37:43,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:37:43,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:37:43,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:43,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:43,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:37:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:37:43,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:37:43,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:43,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:43,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:43,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:43,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:43,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:43,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:43,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:43,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:43,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:43,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:43,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:43,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:43,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:43,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:43,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:44,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:37:44,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:44,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:37:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:44,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:37:44,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:44,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:44,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:44,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:44,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:44,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:37:44,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:37:44,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:44,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:44,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:37:44,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:37:44,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:44,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:44,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:44,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +26: [2023-05-10 12:37:44,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:44,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:37:44,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:37:44,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:44,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:44,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:37:44,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:44,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:44,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:44,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:37:44,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:37:44,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:37:44,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:44,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:37:44,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +26: [2023-05-10 12:37:44,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:37:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:37:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:37:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:37:44,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +16: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:37:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:37:44,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:37:44,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:37:44,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:37:44,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:37:44,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:37:44,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:37:44,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:37:44,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:37:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:37:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:37:44,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:44,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:44,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:37:44,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:37:44,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:37:44,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:44,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:44,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:37:44,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +30: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +30: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:44,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:37:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:37:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:44,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:37:44,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:44,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:37:44,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:37:44,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:37:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:37:44,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:37:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:37:44,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:37:44,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:37:44,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:37:44,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:37:44,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:37:44,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:37:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:37:44,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:37:44,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:37:44,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:37:44,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:37:44,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:37:44,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:44,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:37:44,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:37:44,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:37:44,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:37:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:37:44,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:44,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:37:44,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:37:44,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:44,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:37:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:37:44,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:37:44,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:37:44,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:37:44,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:37:44,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:37:44,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:37:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:37:44,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:37:44,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:44,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:37:44,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +18: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:37:44,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:44,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:44,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:44,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:44,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:37:44,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:44,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:44,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +18: [2023-05-10 12:37:44,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:37:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:44,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:37:44,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:37:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:44,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:37:44,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:37:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:37:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:37:44,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:37:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:44,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:44,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:37:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_21-model_01-model_states.pt. +13: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:44,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:37:44,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:37:44,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:37:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:37:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:37:44,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:37:44,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:37:44,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:37:44,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:37:44,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:37:44,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:37:44,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:37:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:37:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:37:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:37:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:44,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:44,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:37:44,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:37:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:37:44,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:37:44,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:37:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:37:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:37:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:37:44,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:37:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:44,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:37:44,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:37:44,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:37:44,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:37:44,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:37:44,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:37:44,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:37:44,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:37:44,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:37:44,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:37:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:37:44,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:37:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:44,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:37:44,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:44,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:37:44,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:37:44,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:37:44,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:37:44,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:37:44,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:37:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:37:44,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:37:44,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:37:44,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:37:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:37:44,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:37:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:44,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:37:44,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:44,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:37:44,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:37:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:37:44,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:37:44,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:44,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:37:44,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:37:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:37:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:37:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:37:44,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:37:44,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:37:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:37:44,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:37:44,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:37:44,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:37:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:37:44,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:37:44,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:37:44,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:37:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:37:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:37:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:37:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:37:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:37:44,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:37:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:37:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:37:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:37:44,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:37:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:37:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:37:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:37:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:37:44,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:37:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:37:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:37:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:37:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:37:44,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:37:44,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:37:44,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:37:44,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:37:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:37:44,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:37:44,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:37:44,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:37:44,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:37:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:37:44,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:37:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:37:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:37:44,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:37:44,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:37:44,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +18: [2023-05-10 12:37:44,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:37:44,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:37:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:37:44,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:37:44,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:37:44,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:37:44,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:37:44,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:37:44,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:37:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +27: [2023-05-10 12:37:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:37:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:37:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:37:44,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:37:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:37:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:37:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:37:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:44,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:44,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:44,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +22: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:37:44,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:37:44,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:37:44,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:37:44,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:37:44,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:37:44,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:37:44,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:37:44,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:37:44,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:37:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:44,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +27: [2023-05-10 12:37:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:44,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:37:44,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:37:44,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:37:44,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:37:44,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:37:44,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:37:44,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:37:44,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:44,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:37:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:37:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:37:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:37:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:37:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:37:44,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:37:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:37:44,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:37:44,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:37:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:37:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:37:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:37:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:37:44,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:37:44,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +27: [2023-05-10 12:37:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:37:44,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:37:44,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:37:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:37:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:37:44,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:37:44,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:37:44,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:37:44,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:37:44,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:37:44,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:37:44,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:37:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:37:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:37:44,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +18: [2023-05-10 12:37:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +18: [2023-05-10 12:37:44,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:37:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:37:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:37:44,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:37:44,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:37:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:44,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:44,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:44,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:37:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:37:44,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:37:44,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:37:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:37:44,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:37:44,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:37:44,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:37:44,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:37:44,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:37:44,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:37:44,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:44,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:37:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:37:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:44,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:37:44,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:37:44,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:37:44,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:37:44,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:37:44,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:37:44,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:37:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:37:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:37:44,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:37:44,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:37:44,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:37:44,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:37:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:44,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:37:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:37:44,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:37:44,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:37:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:37:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:37:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:37:44,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:37:44,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:37:44,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:37:44,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:44,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:37:44,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:37:44,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:44,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:44,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:44,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:37:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:37:44,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:37:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:37:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:37:44,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:37:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:37:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:44,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:37:44,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:44,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:37:44,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:44,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:44,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:37:44,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:37:44,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:37:44,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:37:44,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:37:44,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:37:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:37:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:44,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:37:44,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:37:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:37:44,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:37:44,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:37:44,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:37:44,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:37:44,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:44,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:37:44,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:44,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:44,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:37:44,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:37:44,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:37:44,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:37:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:37:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:44,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:37:44,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:44,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:37:44,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:44,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:44,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:37:44,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:37:44,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:37:44,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:37:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:44,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:37:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:44,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:44,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:37:44,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:37:44,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +27: [2023-05-10 12:37:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:37:44,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:37:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:37:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:37:44,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:44,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:44,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:37:44,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:44,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:44,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:37:44,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:37:44,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:44,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:44,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:44,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:37:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:44,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:44,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:44,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:44,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:37:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:37:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:44,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:37:44,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:37:44,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:37:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:44,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:37:44,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:37:44,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:44,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:37:44,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:37:44,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:37:44,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:44,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:37:44,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:44,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:37:44,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:44,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:44,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:37:44,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:37:44,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:44,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:44,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:44,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:44,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:44,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:44,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:44,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:44,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:44,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:44,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:44,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:44,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:44,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:44,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:44,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:44,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:44,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:37:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:37:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:37:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:44,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:44,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:44,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:37:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:44,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:37:44,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:37:44,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:37:44,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:37:44,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:37:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:37:44,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:37:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:37:44,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:37:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:37:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:37:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:37:44,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:37:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:37:44,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:37:44,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:44,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:37:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:37:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:44,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:44,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:44,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:37:44,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:37:44,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:37:44,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:44,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:44,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:37:44,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:37:44,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:45,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:37:45,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:45,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:45,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:37:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:37:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:37:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:37:45,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:37:45,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:45,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:37:45,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:37:45,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:45,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:45,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:37:45,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:37:45,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:37:45,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:37:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:45,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:37:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:37:45,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:45,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:37:45,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:45,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:37:45,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:37:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:37:45,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:37:45,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:37:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:37:45,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:37:45,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:37:45,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:37:45,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:37:45,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:37:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:45,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:37:45,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:37:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:37:45,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:37:45,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:37:45,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:45,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:45,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:45,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:37:45,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:37:45,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:37:45,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:37:45,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:37:45,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:37:45,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:37:45,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:37:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:37:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:37:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:37:45,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:37:45,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:37:45,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:37:45,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:37:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:37:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:37:45,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:45,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:37:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:45,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:37:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:37:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:37:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:37:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:37:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:37:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:37:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:37:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:37:45,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:37:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:37:45,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:37:45,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:37:45,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:45,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:37:45,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:37:45,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:37:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:37:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:37:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:37:45,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:37:45,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:45,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:45,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:45,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:37:45,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:37:45,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:45,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:37:45,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:37:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:45,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:37:45,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:45,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +25: [2023-05-10 12:37:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:45,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:37:45,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:45,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:45,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:37:45,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:37:45,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:37:45,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:45,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:37:45,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:37:45,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:37:45,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:37:45,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +25: [2023-05-10 12:37:45,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:45,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:37:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:37:45,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... +25: [2023-05-10 12:37:45,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:37:45,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:37:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:37:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:37:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:37:45,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:37:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:37:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:37:45,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:37:45,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:37:45,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:45,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:37:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:37:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:37:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:37:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:37:45,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:37:45,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:37:45,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:37:45,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:37:45,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:37:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:37:45,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:37:45,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:37:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:37:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:37:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:37:45,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:37:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:37:45,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:37:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:37:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:37:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:37:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:37:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:37:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:37:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:37:45,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:37:45,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:37:45,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:37:45,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:45,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:45,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:37:45,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:37:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:45,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:37:45,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:37:45,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:37:45,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:37:45,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:37:45,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:45,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:37:45,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:37:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:37:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:37:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:45,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:37:45,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:37:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:37:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:37:45,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:37:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:37:45,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:37:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:37:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:37:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:37:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:45,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:37:45,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:45,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:37:45,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:37:45,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:37:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +12: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:37:45,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:37:45,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:37:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:37:45,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:37:45,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:37:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:37:45,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:37:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:37:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:37:45,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:37:45,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:37:45,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:37:45,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:37:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:37:45,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:37:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:37:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:37:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:37:45,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:37:45,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:37:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:37:45,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:37:45,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:37:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:37:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:37:45,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:37:45,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:37:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:37:45,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:37:45,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:37:45,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:37:45,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:37:45,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:37:45,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:37:45,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:37:45,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:37:45,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:37:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:37:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:37:45,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:45,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:45,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:45,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:45,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:37:45,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:37:45,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:45,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:37:45,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:45,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:37:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:37:45,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:45,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:37:45,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:37:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:37:45,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +19: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:37:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:37:45,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:37:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:37:45,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:37:45,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:37:45,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:45,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:37:45,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:37:45,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:37:45,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:37:45,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:37:45,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:37:45,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:37:45,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:37:45,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:45,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:37:45,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +26: [2023-05-10 12:37:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:37:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:37:45,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:37:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:37:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:37:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:37:45,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:37:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:37:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:37:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:37:45,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:37:45,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:37:45,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:37:45,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:37:45,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:37:45,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:37:45,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:37:45,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:37:45,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:37:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:37:45,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:37:45,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:37:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:45,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:37:45,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:37:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:37:45,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:37:45,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:37:45,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:37:45,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:37:45,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:37:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:37:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:45,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:37:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:37:45,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:37:45,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:37:45,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:37:45,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:37:45,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:45,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:37:45,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:37:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:37:45,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:37:45,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:37:45,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:37:45,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:45,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:37:45,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:37:45,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:37:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:37:45,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:37:45,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:37:45,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:37:45,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:37:45,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:37:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:37:45,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:37:45,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:37:45,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:37:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:37:45,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:37:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:37:45,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:37:45,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:37:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:37:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:37:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:37:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:37:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:37:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:37:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:37:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:37:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:37:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:37:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:37:45,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:37:45,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:37:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:37:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:37:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:37:45,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:37:45,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:37:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:37:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:37:45,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:37:45,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:37:45,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:37:45,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:37:45,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:37:45,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:37:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:37:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:37:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:37:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:37:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:37:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:37:45,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:45,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:37:45,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:37:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:45,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:37:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:37:45,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:37:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:37:45,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:37:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:37:45,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:37:45,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:37:45,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:45,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:37:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:45,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:45,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:37:45,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:37:45,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:45,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:45,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:37:45,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:45,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:45,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:37:45,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:37:45,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:37:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:37:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:37:45,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:45,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:37:45,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:45,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:45,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:37:45,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:45,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:37:45,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:45,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:37:45,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:37:45,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:45,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:37:45,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:45,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 3: [2023-05-10 12:37:45,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:45,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:37:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:37:45,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:45,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:37:45,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:37:45,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:45,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:37:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:45,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:45,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:45,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:45,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:37:45,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:45,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:45,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:37:45,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:45,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:37:45,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:45,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:37:45,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:45,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:37:45,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:37:45,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:37:45,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:37:45,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:45,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:37:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:37:45,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:45,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:37:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:45,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:37:45,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:45,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:45,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:45,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:37:45,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:37:45,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:37:45,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:37:45,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:37:45,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:37:45,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:37:45,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:37:45,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:37:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:45,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:45,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:45,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:45,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:37:45,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:45,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:45,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:45,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:37:45,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:45,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:45,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:37:45,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:45,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:45,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:45,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:45,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:45,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:45,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:45,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:45,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:45,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:45,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:45,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:45,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:45,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:45,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:37:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:37:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:37:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:45,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:45,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:37:45,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:37:45,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:37:45,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:45,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:37:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:37:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:37:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:45,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:37:46,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:46,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:46,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:37:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:37:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:37:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:37:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:37:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:37:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:37:46,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:37:46,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:37:46,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:46,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:46,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:46,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:46,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:46,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:37:46,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:46,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:37:46,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:46,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:37:46,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:37:46,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:37:46,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:37:46,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:37:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:46,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +31: [2023-05-10 12:37:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:46,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:37:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:37:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:46,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:46,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:37:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:37:46,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:46,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:37:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:37:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:37:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:37:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:37:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:37:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:37:46,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:46,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:37:46,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:37:46,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:46,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:37:46,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:37:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:37:46,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:46,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:37:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:46,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:37:46,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:46,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:37:46,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:37:46,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:37:46,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:37:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:37:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:37:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:37:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:37:46,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:37:46,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:37:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:37:46,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:46,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:46,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:37:46,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:37:46,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:46,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:37:46,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:37:46,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:37:46,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:37:46,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:37:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:37:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:37:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:37:46,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:37:46,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:37:46,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +20: [2023-05-10 12:37:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +19: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:37:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:37:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:37:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:37:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:37:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:37:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:37:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:37:46,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:37:46,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:37:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:37:46,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:37:46,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:37:46,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:37:46,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:37:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:37:46,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:37:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:37:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:37:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:37:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +28: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:37:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:37:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:46,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:37:46,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:37:46,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:37:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:37:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:37:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:37:46,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:37:46,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:46,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:37:46,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:37:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:37:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:37:46,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:37:46,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:37:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:37:46,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:37:46,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:37:46,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:37:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:37:46,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:37:46,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:37:46,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:37:46,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:37:46,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:37:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:37:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:37:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:37:46,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:37:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:37:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:37:46,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:37:46,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:37:46,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:37:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:37:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:37:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +28: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:37:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:37:46,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +28: [2023-05-10 12:37:46,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:37:46,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:37:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:46,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:37:46,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:37:46,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:37:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:37:46,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:37:46,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +10: [2023-05-10 12:37:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:37:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:37:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:37:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:37:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:37:46,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:37:46,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:37:46,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:37:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:37:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:37:46,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:37:46,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:37:46,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:37:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:37:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:37:46,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:37:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:37:46,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:37:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:37:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:37:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:37:46,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:37:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:37:46,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:37:46,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:37:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:37:46,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:46,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:37:46,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:37:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:37:46,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:37:46,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:37:46,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:46,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:37:46,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:37:46,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:37:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:37:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:37:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:37:46,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:37:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:37:46,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:37:46,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:37:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:37:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:37:46,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:37:46,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:37:46,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:37:46,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:37:46,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:37:46,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:37:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:37:46,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:37:46,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:37:46,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:46,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:37:46,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:37:46,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:37:46,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:37:46,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:37:46,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:37:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:37:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:37:46,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:37:46,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:37:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:37:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:37:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:37:46,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:37:46,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:37:46,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:37:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:37:46,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:37:46,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:37:46,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:37:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:37:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:37:46,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +18: [2023-05-10 12:37:46,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:37:46,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:37:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:37:46,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:37:46,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:37:46,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:37:46,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:37:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:37:46,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:37:46,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:37:46,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:37:46,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:37:46,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:37:46,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:37:46,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:37:46,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:37:46,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:37:46,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:37:46,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:37:46,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:37:46,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:37:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:37:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:37:46,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:37:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:37:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:37:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:37:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:37:46,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:37:46,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:37:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:37:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:37:46,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:37:46,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:37:46,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:37:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:37:46,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:37:46,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +27: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:37:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:37:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:37:46,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:37:46,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:37:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:37:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:37:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:37:46,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:37:46,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:37:46,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:37:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:37:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:37:46,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:37:46,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:37:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:37:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:37:46,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:37:46,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:37:46,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:37:46,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:37:46,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:37:46,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:37:46,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:37:46,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:37:46,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:37:46,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:37:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:37:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:37:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:37:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:37:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:37:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:37:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:37:46,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:37:46,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:37:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:37:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:37:46,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:37:46,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:37:46,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:37:46,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:37:46,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:37:46,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:37:46,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:37:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:37:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:37:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:37:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:37:46,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:46,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:46,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:37:46,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:37:46,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:46,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:46,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:46,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:46,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:46,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:37:46,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:37:46,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:37:46,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:37:46,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:37:46,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:37:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:37:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:37:46,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:37:46,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:37:46,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:37:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:46,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:37:46,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:37:46,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:37:46,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:37:46,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:37:46,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:37:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:37:46,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:37:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:37:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:37:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:46,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:37:46,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:37:46,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:46,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:46,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:46,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:46,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:37:46,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:46,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:37:46,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:46,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:37:46,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:46,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:46,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:37:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:37:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:46,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:46,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:46,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:46,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:37:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:46,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:46,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:46,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:46,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:37:46,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:37:46,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:37:46,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:37:46,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:37:46,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:46,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:37:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:37:46,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:37:46,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:46,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:46,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:46,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:46,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:46,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:37:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:37:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:37:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:37:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:37:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:37:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:37:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:37:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:37:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:46,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:46,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:46,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:37:46,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:37:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:46,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:46,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:46,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:46,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:46,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:46,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:46,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:37:46,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:37:46,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:37:46,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:46,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:46,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:37:46,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:37:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:37:46,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:37:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:37:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:37:46,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:37:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +18: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:37:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:37:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:37:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:37:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:37:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:37:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:37:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:37:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:37:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:37:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:37:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:37:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +18: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:46,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:37:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:37:46,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:37:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:37:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:37:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:37:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:46,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:37:46,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:37:46,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:37:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:37:46,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:37:46,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:37:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:37:46,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:37:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:37:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:37:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:37:46,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:37:46,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:46,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:37:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:46,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:37:46,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:37:46,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:37:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:37:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:37:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:37:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:37:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:37:46,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:37:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:37:46,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:37:46,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:37:46,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:37:46,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:37:46,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:46,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:37:46,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:37:46,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:37:46,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:37:46,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:37:46,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:37:46,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:37:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:37:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:46,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:37:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:37:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:37:46,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:37:46,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:46,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:37:46,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:37:46,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:46,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:46,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:37:46,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:37:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:37:46,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:37:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:37:46,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:37:47,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:37:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:37:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:47,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:37:47,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:47,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:37:47,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:47,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:37:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:37:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:37:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:37:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:47,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:47,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:47,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:37:47,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:47,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:47,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:47,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:37:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:37:47,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:37:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:37:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:37:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:37:47,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:47,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:37:47,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:37:47,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:47,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:37:47,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:37:47,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:37:47,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:37:47,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:37:47,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:47,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:47,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:37:47,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:47,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:37:47,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:47,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:37:47,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:47,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:37:47,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:37:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:47,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:37:47,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:37:47,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:37:47,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:47,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:37:47,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:37:47,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:37:47,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:37:47,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:37:47,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:37:47,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:37:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:37:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:37:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:37:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:37:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:37:47,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:37:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:37:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:37:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:37:47,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:37:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:37:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:37:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:37:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +12: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:37:47,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:37:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:37:47,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:47,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:47,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:37:47,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:47,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:37:47,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:37:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:37:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:37:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:47,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:37:47,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:37:47,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:37:47,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:47,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:37:47,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:37:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:37:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:37:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:37:47,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:47,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +11: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:37:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:37:47,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:37:47,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:37:47,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:37:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:37:47,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:37:47,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:37:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +17: [2023-05-10 12:37:47,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:37:47,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:37:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:37:47,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:37:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:37:47,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:37:47,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:37:47,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:47,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:37:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:37:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:37:47,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:37:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:37:47,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:37:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:37:47,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:37:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:37:47,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:37:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:37:47,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:37:47,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:37:47,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:37:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:37:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:37:47,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:37:47,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:37:47,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:37:47,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:37:47,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:37:47,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:37:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:37:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:47,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:37:47,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:37:47,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:37:47,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:37:47,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:37:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:37:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:37:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:37:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:37:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:37:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:37:47,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:37:47,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:37:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:37:47,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:37:47,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:37:47,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:37:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:37:47,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:37:47,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:37:47,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:37:47,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:47,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +22: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:37:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:37:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:37:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:37:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +28: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:37:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:37:47,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:37:47,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:37:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 3: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:37:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:37:47,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:37:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:37:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:37:47,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:37:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:47,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:37:47,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:37:47,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:37:47,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:37:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:37:47,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:37:47,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:37:47,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:37:47,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:37:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:37:47,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:37:47,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:37:47,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:37:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:37:47,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:37:47,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:37:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:37:47,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:37:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:37:47,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:47,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:37:47,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:37:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:37:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:37:47,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:37:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:37:47,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:37:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:37:47,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:37:47,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:37:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:37:47,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:37:47,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:37:47,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:37:47,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:37:47,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:47,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:37:47,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:37:47,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:47,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:37:47,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:37:47,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:37:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:37:47,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:37:47,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:37:47,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:37:47,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:37:47,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:37:47,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:37:47,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:37:47,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:37:47,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:37:47,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:47,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:37:47,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:37:47,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:37:47,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:47,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:37:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:37:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:37:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:37:47,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:47,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:37:47,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:37:47,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:37:47,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:37:47,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:37:47,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:37:47,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:37:47,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:47,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:37:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:47,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:37:47,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:37:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:37:47,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:37:47,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:37:47,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:37:47,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:37:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:37:47,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:37:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:47,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:37:47,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:37:47,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:47,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:37:47,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:47,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:47,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:37:47,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:37:47,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:37:47,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:37:47,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:37:47,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:37:47,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:37:47,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:37:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:37:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:47,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:37:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:37:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:37:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:37:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:37:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:37:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:37:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:37:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:37:47,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:37:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:37:47,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:37:47,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:37:47,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:37:47,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:37:47,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:37:47,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:37:47,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:37:47,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:37:47,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:37:47,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:37:47,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:37:47,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:37:47,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:37:47,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:37:47,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:37:47,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:37:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:37:47,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:37:47,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:37:47,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:37:47,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:37:47,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:37:47,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:37:47,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:37:47,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:37:47,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:37:47,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:37:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:37:47,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:37:47,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:37:47,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:37:47,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:37:47,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:37:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:37:47,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:37:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:37:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:37:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:37:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:37:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:37:47,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:37:47,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:37:47,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:37:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:37:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:37:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:37:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:37:47,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:37:47,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:37:47,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:37:47,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:37:47,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:37:47,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:37:47,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:37:47,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:37:47,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:37:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:37:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:37:47,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:37:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:37:47,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:37:47,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:47,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:37:47,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:37:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:37:47,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:37:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:37:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:37:47,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:37:47,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:47,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:37:47,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:37:47,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:37:47,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:37:47,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:37:47,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:37:47,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:37:47,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +28: [2023-05-10 12:37:47,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:47,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:37:47,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:37:47,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:47,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:37:47,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:37:47,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:47,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:47,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:37:47,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:47,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:37:47,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:47,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:37:47,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:37:47,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +17: [2023-05-10 12:37:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:47,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:47,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:47,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:47,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:47,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:37:47,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:37:47,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:37:47,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:47,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:37:47,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:47,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:47,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:37:47,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:47,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:47,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:37:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:37:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:37:47,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:37:47,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:47,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:47,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +17: [2023-05-10 12:37:47,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:47,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:37:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:37:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:37:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:47,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:47,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:37:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:47,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:47,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:37:47,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:37:47,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:37:47,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:37:47,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:37:47,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:37:47,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:47,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:47,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:37:47,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:37:47,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:47,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:47,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:47,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:47,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:37:47,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:47,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:47,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:47,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:47,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:47,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:47,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:37:47,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:37:47,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:37:47,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:37:48,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:37:48,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:37:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:37:48,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:37:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:37:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:37:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:37:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:37:48,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:48,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:48,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:48,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:48,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:37:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:48,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:48,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:37:48,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +18: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:37:48,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:37:48,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:37:48,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:48,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:37:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:37:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +17: [2023-05-10 12:37:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:37:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:48,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:37:48,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:37:48,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:37:48,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:48,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:37:48,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:37:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:37:48,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:37:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:37:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:37:48,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:37:48,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:37:48,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:37:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:37:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:37:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:37:48,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:37:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:37:48,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:37:48,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:37:48,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:37:48,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:37:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:37:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:37:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:37:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:37:48,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:37:48,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:37:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:37:48,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:37:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:37:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:37:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:37:48,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:37:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:37:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:37:48,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:48,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:37:48,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:37:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:48,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:37:48,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:37:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:37:48,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:37:48,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:37:48,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:37:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:37:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:37:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:37:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:37:48,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:37:48,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:37:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:37:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:37:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:37:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:37:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:37:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:37:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:37:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:37:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:37:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:37:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:37:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:37:48,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:37:48,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:37:48,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:37:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:37:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:37:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:37:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:37:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:37:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:37:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:37:48,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:37:48,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:37:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:37:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:37:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:37:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:37:48,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:37:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:37:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:37:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:37:48,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:37:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:37:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:37:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:37:48,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:48,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:37:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:37:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:37:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:37:48,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:37:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:37:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:37:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 0: > overriding learning rate value to 0.0002 + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 + 0: > overriding total number of iterations value to 1 +10: [2023-05-10 12:37:48,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: > overriding decay style value to cosine +10: [2023-05-10 12:37:48,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:37:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:37:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:37:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:37:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:37:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:37:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:37:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:37:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:37:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:37:48,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:37:48,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:37:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:37:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:37:48,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:37:48,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:37:48,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:37:48,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:37:48,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:37:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:37:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:37:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:37:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:37:48,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:37:48,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:37:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:37:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:37:48,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:37:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +23: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:37:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:37:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +23: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:37:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +23: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:37:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:37:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:37:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:37:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:37:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:37:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:37:48,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:37:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:37:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:37:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:37:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:37:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:37:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:37:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:37:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:37:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:37:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:37:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:37:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:37:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:37:48,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:37:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:37:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:37:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:37:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:37:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:37:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:37:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:37:48,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:37:48,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:37:48,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:37:48,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:37:48,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:37:48,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:37:48,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:37:48,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:37:48,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:37:48,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:37:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:37:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:37:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:37:48,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:37:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:37:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:37:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:37:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:37:48,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:37:48,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:37:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:37:48,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:37:48,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:37:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:37:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:37:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:37:48,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:37:48,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:37:48,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:37:48,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:37:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:37:48,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:37:48,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:37:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:37:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:37:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:37:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:37:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:37:48,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:37:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:37:48,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:37:48,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:37:48,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:37:48,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:37:48,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:37:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:37:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:37:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:37:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:37:48,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:48,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:37:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:37:48,511] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 112 + 9: [2023-05-10 12:37:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:37:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:37:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:37:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:37:48,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,515] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 112 +14: [2023-05-10 12:37:48,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:37:48,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:37:48,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:37:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:37:48,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:37:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:37:48,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:37:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:37:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,523] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 248 + 1: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:37:48,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:37:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:37:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:37:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:37:48,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,527] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 248 +19: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:37:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:37:48,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:37:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:37:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:37:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:37:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:37:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:37:48,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:37:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:37:48,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:37:48,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:37:48,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:37:48,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:37:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:37:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:37:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:37:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:37:48,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:37:48,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:37:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:37:48,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:37:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:37:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:37:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:37:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:37:48,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:37:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:37:48,541] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 20 +13: [2023-05-10 12:37:48,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:37:48,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:37:48,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:37:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:37:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:37:48,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:37:48,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:37:48,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,546] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 20 +31: [2023-05-10 12:37:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:37:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:37:48,547] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 194 +23: [2023-05-10 12:37:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:37:48,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:37:48,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:37:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:37:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:37:48,552] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 194 +23: [2023-05-10 12:37:48,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:37:48,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:37:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:37:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:37:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:37:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:37:48,567] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 70 +24: [2023-05-10 12:37:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:37:48,569] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 192 + 5: [2023-05-10 12:37:48,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,571] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 70 + 5: [2023-05-10 12:37:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:37:48,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:37:48,574] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 192 + 5: [2023-05-10 12:37:48,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:37:48,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:37:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:37:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:37:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:37:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:37:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:37:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:37:48,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:37:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:37:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:37:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:37:48,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:37:48,581] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 196 +24: [2023-05-10 12:37:48,585] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 196 +24: [2023-05-10 12:37:48,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:37:48,587] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 198 +24: [2023-05-10 12:37:48,591] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 198 +10: [2023-05-10 12:37:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:37:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:37:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:37:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:37:48,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:37:48,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:37:48,606] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 246 +17: [2023-05-10 12:37:48,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:37:48,606] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 64 +17: [2023-05-10 12:37:48,607] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 138 + 8: [2023-05-10 12:37:48,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:37:48,610] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 246 + 8: [2023-05-10 12:37:48,611] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 64 +17: [2023-05-10 12:37:48,611] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 138 +28: [2023-05-10 12:37:48,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:37:48,617] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 226 + 5: [2023-05-10 12:37:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:37:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:37:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:37:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:37:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:37:48,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:37:48,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:37:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:37:48,621] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 226 +14: [2023-05-10 12:37:48,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:37:48,622] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 116 + 8: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:37:48,626] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 116 + 8: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:37:48,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:37:48,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:37:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:37:48,631] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 250 + 3: [2023-05-10 12:37:48,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:37:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,636] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 250 +12: [2023-05-10 12:37:48,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:37:48,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:37:48,638] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 100 + 0: [2023-05-10 12:37:48,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:37:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:37:48,641] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 252 +12: [2023-05-10 12:37:48,642] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 100 +14: [2023-05-10 12:37:48,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:37:48,643] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 118 + 0: [2023-05-10 12:37:48,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:37:48,644] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 22 +31: [2023-05-10 12:37:48,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:37:48,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,644] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 254 + 0: [2023-05-10 12:37:48,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,645] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 252 + 2: [2023-05-10 12:37:48,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:37:48,646] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 18 +26: [2023-05-10 12:37:48,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:37:48,647] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 214 +14: [2023-05-10 12:37:48,648] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 118 + 2: [2023-05-10 12:37:48,648] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 22 + 0: [2023-05-10 12:37:48,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,649] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 254 + 0: [2023-05-10 12:37:48,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:37:48,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:37:48,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:37:48,650] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 18 +14: [2023-05-10 12:37:48,650] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 114 +26: [2023-05-10 12:37:48,651] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 214 + 8: [2023-05-10 12:37:48,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:37:48,653] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 66 + 0: [2023-05-10 12:37:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:37:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:37:48,654] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 114 + 0: [2023-05-10 12:37:48,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,658] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 66 + 8: [2023-05-10 12:37:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:37:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:37:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:37:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:37:48,670] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 222 +27: [2023-05-10 12:37:48,675] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 222 +18: [2023-05-10 12:37:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:37:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:37:48,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:37:48,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:37:48,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:37:48,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:37:48,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:37:48,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:37:48,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:37:48,679] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 242 +26: [2023-05-10 12:37:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:37:48,683] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 210 +30: [2023-05-10 12:37:48,684] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 242 +30: [2023-05-10 12:37:48,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:37:48,685] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 240 +18: [2023-05-10 12:37:48,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:37:48,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:37:48,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:37:48,687] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 210 +28: [2023-05-10 12:37:48,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:37:48,688] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 230 +30: [2023-05-10 12:37:48,689] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 240 +18: [2023-05-10 12:37:48,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:37:48,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:37:48,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:37:48,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:37:48,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:37:48,692] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 230 + 0: [2023-05-10 12:37:48,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:37:48,694] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 6 +12: [2023-05-10 12:37:48,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:37:48,696] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 96 +15: [2023-05-10 12:37:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:37:48,698] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 120 +22: [2023-05-10 12:37:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:37:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:37:48,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:37:48,699] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 122 + 0: [2023-05-10 12:37:48,699] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 6 +22: [2023-05-10 12:37:48,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:37:48,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:37:48,700] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 96 +27: [2023-05-10 12:37:48,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:37:48,702] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 220 +15: [2023-05-10 12:37:48,703] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 120 +15: [2023-05-10 12:37:48,703] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 122 +14: [2023-05-10 12:37:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:37:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:37:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:37:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:37:48,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:37:48,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:37:48,706] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 220 +21: [2023-05-10 12:37:48,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:37:48,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:37:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:37:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:37:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:37:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:37:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:37:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:37:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:37:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:37:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:37:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:37:48,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:37:48,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:37:48,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:37:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:37:48,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:37:48,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:37:48,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:37:48,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,719] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 132 +21: [2023-05-10 12:37:48,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:37:48,723] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 140 +16: [2023-05-10 12:37:48,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:37:48,723] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 134 +21: [2023-05-10 12:37:48,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,723] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 132 +27: [2023-05-10 12:37:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:37:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:37:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:37:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:37:48,724] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 228 +27: [2023-05-10 12:37:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:37:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:37:48,724] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 212 + 2: [2023-05-10 12:37:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:37:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:37:48,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,725] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 84 + 7: [2023-05-10 12:37:48,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:37:48,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,728] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 134 + 6: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,728] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 140 + 6: [2023-05-10 12:37:48,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:37:48,728] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 228 + 6: [2023-05-10 12:37:48,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:37:48,729] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 212 + 6: [2023-05-10 12:37:48,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:37:48,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:37:48,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:48,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:37:48,730] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 216 + 6: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:37:48,730] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 84 +29: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:37:48,730] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 154 + 6: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:37:48,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:37:48,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:37:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:37:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:37:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,734] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 160 +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,734] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 154 +17: [2023-05-10 12:37:48,734] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 136 +17: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,735] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 216 + 2: [2023-05-10 12:37:48,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:37:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +16: [2023-05-10 12:37:48,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,738] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 160 +17: [2023-05-10 12:37:48,739] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 136 + 2: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:37:48,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,743] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 98 +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:37:48,744] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 4 +19: [2023-05-10 12:37:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:37:48,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:37:48,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:37:48,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:37:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:37:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,748] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 98 +19: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:37:48,748] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 4 + 4: [2023-05-10 12:37:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:37:48,749] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 244 +20: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:37:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:37:48,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:37:48,751] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 224 +14: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:37:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:37:48,753] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 244 + 9: [2023-05-10 12:37:48,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:37:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:37:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:37:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:37:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:37:48,755] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 224 + 4: [2023-05-10 12:37:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:37:48,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:37:48,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:37:48,757] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 156 +19: [2023-05-10 12:37:48,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:37:48,758] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 152 +15: [2023-05-10 12:37:48,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:37:48,758] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 126 +19: [2023-05-10 12:37:48,761] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 156 + 9: [2023-05-10 12:37:48,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:37:48,763] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 126 + 9: [2023-05-10 12:37:48,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:37:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:37:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:37:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:37:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:37:48,764] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 152 + 9: [2023-05-10 12:37:48,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:37:48,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:37:48,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:37:48,764] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 142 + 9: [2023-05-10 12:37:48,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:37:48,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:37:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +16: [2023-05-10 12:37:48,767] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 128 +31: [2023-05-10 12:37:48,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:37:48,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:37:48,768] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 142 +31: [2023-05-10 12:37:48,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:37:48,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:37:48,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:37:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:37:48,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:37:48,772] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 16 +17: [2023-05-10 12:37:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:37:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:37:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:37:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:37:48,773] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 128 + 2: [2023-05-10 12:37:48,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:37:48,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:37:48,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:37:48,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:37:48,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 16 +31: [2023-05-10 12:37:48,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:37:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:37:48,779] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 102 +25: [2023-05-10 12:37:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:37:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:37:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:37:48,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:37:48,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:37:48,783] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 110 +22: [2023-05-10 12:37:48,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:37:48,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:37:48,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:37:48,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:37:48,784] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 102 + 6: [2023-05-10 12:37:48,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:37:48,785] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 52 +13: [2023-05-10 12:37:48,787] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 110 + 7: [2023-05-10 12:37:48,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:37:48,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:37:48,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:37:48,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:37:48,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:37:48,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:37:48,789] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 218 +25: [2023-05-10 12:37:48,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:37:48,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:37:48,790] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 52 +25: [2023-05-10 12:37:48,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:37:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:37:48,793] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 218 +25: [2023-05-10 12:37:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:37:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:37:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:37:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:37:48,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:37:48,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:37:48,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:37:48,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:37:48,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:37:48,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:37:48,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:37:48,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:37:48,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:37:48,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:37:48,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:37:48,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:37:48,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:37:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:37:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:37:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:37:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:37:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:37:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:37:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:37:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:37:48,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:37:48,809] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 68 +23: [2023-05-10 12:37:48,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:37:48,809] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 184 +11: [2023-05-10 12:37:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:37:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:37:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:37:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:37:48,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:37:48,812] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 2 +23: [2023-05-10 12:37:48,814] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 184 + 8: [2023-05-10 12:37:48,814] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 68 +13: [2023-05-10 12:37:48,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:37:48,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:37:48,817] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 208 +13: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:37:48,817] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 130 +20: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:37:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:37:48,818] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 2 +20: [2023-05-10 12:37:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:37:48,819] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 166 +31: [2023-05-10 12:37:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:37:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:37:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:37:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:37:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:37:48,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 208 + 1: [2023-05-10 12:37:48,821] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 10 +16: [2023-05-10 12:37:48,822] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 130 +13: [2023-05-10 12:37:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:37:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:37:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:37:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:37:48,824] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 166 +25: [2023-05-10 12:37:48,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:37:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:37:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:37:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:37:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:37:48,825] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 200 + 0: [2023-05-10 12:37:48,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:37:48,825] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 0 + 9: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:37:48,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:37:48,827] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 10 +25: [2023-05-10 12:37:48,829] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 200 + 0: [2023-05-10 12:37:48,830] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 0 + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 + 5: [2023-05-10 12:37:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:37:48,831] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 44 +19: [2023-05-10 12:37:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:37:48,835] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 158 + 5: [2023-05-10 12:37:48,835] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 44 +30: [2023-05-10 12:37:48,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:37:48,837] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 247 +11: [2023-05-10 12:37:48,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:37:48,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:37:48,838] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 94 +13: [2023-05-10 12:37:48,838] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 108 +19: [2023-05-10 12:37:48,839] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 158 + 7: [2023-05-10 12:37:48,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:37:48,841] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 58 +30: [2023-05-10 12:37:48,842] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 247 +24: [2023-05-10 12:37:48,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:37:48,842] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 94 +24: [2023-05-10 12:37:48,842] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 197 +13: [2023-05-10 12:37:48,843] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 108 +10: [2023-05-10 12:37:48,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:37:48,843] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 82 +24: [2023-05-10 12:37:48,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 197 + 7: [2023-05-10 12:37:48,847] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 58 +10: [2023-05-10 12:37:48,847] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 82 +26: [2023-05-10 12:37:48,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:37:48,850] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 211 +26: [2023-05-10 12:37:48,854] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 211 +10: [2023-05-10 12:37:48,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:37:48,857] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 80 +20: [2023-05-10 12:37:48,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:37:48,858] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 164 +10: [2023-05-10 12:37:48,861] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 80 + 9: [2023-05-10 12:37:48,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:37:48,864] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 72 +20: [2023-05-10 12:37:48,864] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 164 +25: [2023-05-10 12:37:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:37:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:37:48,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:37:48,866] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 215 +25: [2023-05-10 12:37:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:37:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:37:48,868] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 72 + 7: [2023-05-10 12:37:48,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:37:48,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:37:48,868] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 231 + 7: [2023-05-10 12:37:48,868] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 62 +13: [2023-05-10 12:37:48,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:37:48,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:37:48,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:37:48,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:37:48,870] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 215 + 4: [2023-05-10 12:37:48,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:37:48,871] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 36 +28: [2023-05-10 12:37:48,873] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 231 + 7: [2023-05-10 12:37:48,873] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 62 +29: [2023-05-10 12:37:48,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:48,874] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 234 + 4: [2023-05-10 12:37:48,877] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 36 +13: [2023-05-10 12:37:48,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:37:48,878] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 104 +29: [2023-05-10 12:37:48,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:48,879] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 232 + 3: [2023-05-10 12:37:48,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:37:48,880] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 26 +29: [2023-05-10 12:37:48,880] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 234 +13: [2023-05-10 12:37:48,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 104 +25: [2023-05-10 12:37:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:37:48,884] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 26 +25: [2023-05-10 12:37:48,884] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 206 + 4: [2023-05-10 12:37:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:48,884] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 232 + 4: [2023-05-10 12:37:48,885] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 32 + 9: [2023-05-10 12:37:48,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:37:48,886] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 74 +25: [2023-05-10 12:37:48,889] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 206 + 4: [2023-05-10 12:37:48,889] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 32 + 9: [2023-05-10 12:37:48,890] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 74 +30: [2023-05-10 12:37:48,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:37:48,894] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 243 +15: [2023-05-10 12:37:48,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:37:48,895] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 124 +30: [2023-05-10 12:37:48,898] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 243 +28: [2023-05-10 12:37:48,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:37:48,899] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 229 +15: [2023-05-10 12:37:48,900] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 124 +28: [2023-05-10 12:37:48,903] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 229 +18: [2023-05-10 12:37:48,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:37:48,904] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 146 + 5: [2023-05-10 12:37:48,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:37:48,907] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 42 +18: [2023-05-10 12:37:48,909] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 146 + 4: [2023-05-10 12:37:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:37:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:37:48,911] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 162 + 4: [2023-05-10 12:37:48,911] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 38 + 5: [2023-05-10 12:37:48,911] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 42 +28: [2023-05-10 12:37:48,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:37:48,912] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 225 +11: [2023-05-10 12:37:48,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:37:48,915] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 92 +20: [2023-05-10 12:37:48,915] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 162 + 4: [2023-05-10 12:37:48,915] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 38 +28: [2023-05-10 12:37:48,916] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 225 +10: [2023-05-10 12:37:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:37:48,920] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 86 +11: [2023-05-10 12:37:48,920] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 92 +10: [2023-05-10 12:37:48,924] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 86 +30: [2023-05-10 12:37:48,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:37:48,925] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 241 +11: [2023-05-10 12:37:48,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:37:48,926] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 88 + 6: [2023-05-10 12:37:48,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:37:48,927] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 50 + 1: [2023-05-10 12:37:48,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:37:48,928] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 12 +30: [2023-05-10 12:37:48,929] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 241 + 9: [2023-05-10 12:37:48,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:37:48,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:37:48,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 76 +21: [2023-05-10 12:37:48,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 168 +11: [2023-05-10 12:37:48,930] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 88 + 6: [2023-05-10 12:37:48,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 50 +29: [2023-05-10 12:37:48,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:48,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 236 + 1: [2023-05-10 12:37:48,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 12 + 9: [2023-05-10 12:37:48,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:37:48,934] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 78 +21: [2023-05-10 12:37:48,934] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 168 + 9: [2023-05-10 12:37:48,935] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 76 +29: [2023-05-10 12:37:48,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 236 + 5: [2023-05-10 12:37:48,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:37:48,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:37:48,938] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 78 +28: [2023-05-10 12:37:48,938] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 227 + 5: [2023-05-10 12:37:48,938] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 46 +24: [2023-05-10 12:37:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:37:48,942] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 46 +24: [2023-05-10 12:37:48,943] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 199 +28: [2023-05-10 12:37:48,943] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 227 +18: [2023-05-10 12:37:48,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:37:48,944] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 150 +11: [2023-05-10 12:37:48,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:37:48,946] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 90 +24: [2023-05-10 12:37:48,947] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 199 +18: [2023-05-10 12:37:48,949] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 150 + 6: [2023-05-10 12:37:48,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:37:48,949] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 48 +11: [2023-05-10 12:37:48,951] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 90 + 3: [2023-05-10 12:37:48,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:37:48,951] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 30 +21: [2023-05-10 12:37:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:37:48,952] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 174 +18: [2023-05-10 12:37:48,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:37:48,954] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 48 +18: [2023-05-10 12:37:48,953] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 148 +23: [2023-05-10 12:37:48,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:37:48,955] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 188 + 1: [2023-05-10 12:37:48,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:37:48,955] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 30 + 1: [2023-05-10 12:37:48,955] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 13 +21: [2023-05-10 12:37:48,957] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 174 +18: [2023-05-10 12:37:48,957] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 148 +13: [2023-05-10 12:37:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:37:48,958] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 106 + 1: [2023-05-10 12:37:48,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:37:48,959] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 188 + 1: [2023-05-10 12:37:48,959] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 8 +26: [2023-05-10 12:37:48,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:37:48,960] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 209 + 1: [2023-05-10 12:37:48,960] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 13 + 4: [2023-05-10 12:37:48,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:37:48,962] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 34 +13: [2023-05-10 12:37:48,963] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 106 + 1: [2023-05-10 12:37:48,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 8 +26: [2023-05-10 12:37:48,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 209 + 4: [2023-05-10 12:37:48,967] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 34 + 3: [2023-05-10 12:37:48,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:37:48,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 24 +25: [2023-05-10 12:37:48,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:37:48,971] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 204 + 3: [2023-05-10 12:37:48,972] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 24 +22: [2023-05-10 12:37:48,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:37:48,974] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 182 +25: [2023-05-10 12:37:48,975] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 204 +22: [2023-05-10 12:37:48,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:37:48,976] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 178 +10: [2023-05-10 12:37:48,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:37:48,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:37:48,976] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 81 +10: [2023-05-10 12:37:48,976] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 85 + 6: [2023-05-10 12:37:48,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:37:48,978] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 54 +22: [2023-05-10 12:37:48,979] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 182 +21: [2023-05-10 12:37:48,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:37:48,980] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 170 +24: [2023-05-10 12:37:48,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:37:48,981] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 193 +22: [2023-05-10 12:37:48,981] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 178 +10: [2023-05-10 12:37:48,982] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 81 +10: [2023-05-10 12:37:48,982] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 85 + 6: [2023-05-10 12:37:48,983] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 54 +25: [2023-05-10 12:37:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:37:48,984] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 202 +21: [2023-05-10 12:37:48,985] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 170 +24: [2023-05-10 12:37:48,985] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 193 +25: [2023-05-10 12:37:48,989] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 202 + 1: [2023-05-10 12:37:48,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:37:48,990] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 14 +24: [2023-05-10 12:37:48,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:37:48,991] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 195 +26: [2023-05-10 12:37:48,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:37:48,993] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 213 + 3: [2023-05-10 12:37:48,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:37:48,995] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 14 + 3: [2023-05-10 12:37:48,995] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 28 +24: [2023-05-10 12:37:48,996] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 195 +26: [2023-05-10 12:37:48,998] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 213 + 3: [2023-05-10 12:37:49,000] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 28 +18: [2023-05-10 12:37:49,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:37:49,000] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 144 +18: [2023-05-10 12:37:49,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 144 +30: [2023-05-10 12:37:49,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:37:49,006] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 245 +29: [2023-05-10 12:37:49,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:37:49,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 238 +30: [2023-05-10 12:37:49,010] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 245 +23: [2023-05-10 12:37:49,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:37:49,013] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 190 + 7: [2023-05-10 12:37:49,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:37:49,014] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 60 +29: [2023-05-10 12:37:49,014] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 238 +23: [2023-05-10 12:37:49,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 190 + 7: [2023-05-10 12:37:49,019] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 60 + 1: [2023-05-10 12:37:49,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:37:49,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 11 + 1: [2023-05-10 12:37:49,033] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 11 + 5: [2023-05-10 12:37:49,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:37:49,040] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 40 + 5: [2023-05-10 12:37:49,045] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 40 + 1: [2023-05-10 12:37:49,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:37:49,050] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 9 + 5: [2023-05-10 12:37:49,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:37:49,050] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 45 +15: [2023-05-10 12:37:49,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:37:49,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 125 +23: [2023-05-10 12:37:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:37:49,052] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 189 +21: [2023-05-10 12:37:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:37:49,053] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 172 + 1: [2023-05-10 12:37:49,054] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 9 + 5: [2023-05-10 12:37:49,054] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 45 +15: [2023-05-10 12:37:49,056] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 125 +23: [2023-05-10 12:37:49,056] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 189 +21: [2023-05-10 12:37:49,057] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 172 +22: [2023-05-10 12:37:49,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:37:49,058] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 176 +22: [2023-05-10 12:37:49,064] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 176 + 5: [2023-05-10 12:37:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:37:49,064] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 47 + 5: [2023-05-10 12:37:49,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:37:49,065] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 43 + 5: [2023-05-10 12:37:49,069] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 47 + 5: [2023-05-10 12:37:49,070] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 43 + 3: [2023-05-10 12:37:49,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:37:49,079] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 29 + 3: [2023-05-10 12:37:49,083] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 29 +23: [2023-05-10 12:37:49,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:37:49,098] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 186 +23: [2023-05-10 12:37:49,102] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 186 +21: [2023-05-10 12:37:49,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:37:49,105] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 169 + 8: [2023-05-10 12:37:49,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:37:49,107] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 71 + 5: [2023-05-10 12:37:49,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:37:49,108] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 41 +21: [2023-05-10 12:37:49,110] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 169 + 8: [2023-05-10 12:37:49,112] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 71 + 8: [2023-05-10 12:37:49,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:37:49,112] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 65 +10: [2023-05-10 12:37:49,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:37:49,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:37:49,113] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 41 +23: [2023-05-10 12:37:49,113] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 191 +10: [2023-05-10 12:37:49,114] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 83 +10: [2023-05-10 12:37:49,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:37:49,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:37:49,115] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 123 +10: [2023-05-10 12:37:49,115] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 87 + 8: [2023-05-10 12:37:49,116] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 65 +10: [2023-05-10 12:37:49,118] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 83 +23: [2023-05-10 12:37:49,118] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 191 + 0: [2023-05-10 12:37:49,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:37:49,119] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 1 +10: [2023-05-10 12:37:49,119] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 87 +15: [2023-05-10 12:37:49,119] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 123 +22: [2023-05-10 12:37:49,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:37:49,122] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 180 + 0: [2023-05-10 12:37:49,123] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 1 +22: [2023-05-10 12:37:49,128] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 180 + 7: [2023-05-10 12:37:49,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:37:49,129] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 56 + 0: [2023-05-10 12:37:49,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:37:49,132] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 3 + 7: [2023-05-10 12:37:49,133] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 56 + 0: [2023-05-10 12:37:49,136] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 3 + 6: [2023-05-10 12:37:49,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:37:49,137] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 53 +23: [2023-05-10 12:37:49,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:37:49,138] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 187 + 1: [2023-05-10 12:37:49,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:37:49,140] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 15 + 6: [2023-05-10 12:37:49,141] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 53 +23: [2023-05-10 12:37:49,143] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 187 + 1: [2023-05-10 12:37:49,144] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 15 +15: [2023-05-10 12:37:49,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:37:49,145] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 121 +18: [2023-05-10 12:37:49,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:37:49,146] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 147 + 4: [2023-05-10 12:37:49,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:37:49,147] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 37 + 8: [2023-05-10 12:37:49,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:37:49,147] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 67 +15: [2023-05-10 12:37:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:37:49,148] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 127 +18: [2023-05-10 12:37:49,150] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 147 +14: [2023-05-10 12:37:49,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:37:49,151] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 37 +14: [2023-05-10 12:37:49,151] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 117 + 8: [2023-05-10 12:37:49,151] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 67 +15: [2023-05-10 12:37:49,152] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 121 + 6: [2023-05-10 12:37:49,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:37:49,152] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 55 +15: [2023-05-10 12:37:49,153] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 127 + 6: [2023-05-10 12:37:49,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:37:49,154] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 51 +14: [2023-05-10 12:37:49,155] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 117 + 7: [2023-05-10 12:37:49,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:37:49,156] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 59 +22: [2023-05-10 12:37:49,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:37:49,157] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 183 + 6: [2023-05-10 12:37:49,157] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 55 +31: [2023-05-10 12:37:49,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:37:49,157] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 255 + 6: [2023-05-10 12:37:49,158] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 51 + 7: [2023-05-10 12:37:49,161] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 59 +31: [2023-05-10 12:37:49,161] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 255 +22: [2023-05-10 12:37:49,162] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 183 + 3: [2023-05-10 12:37:49,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:37:49,172] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 27 +12: [2023-05-10 12:37:49,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:37:49,175] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 101 +19: [2023-05-10 12:37:49,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:37:49,175] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 153 + 3: [2023-05-10 12:37:49,177] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 27 +14: [2023-05-10 12:37:49,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:37:49,179] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 119 + 3: [2023-05-10 12:37:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:37:49,179] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 101 + 3: [2023-05-10 12:37:49,180] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 31 +19: [2023-05-10 12:37:49,180] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 153 +11: [2023-05-10 12:37:49,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:37:49,183] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 93 +14: [2023-05-10 12:37:49,183] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 119 +16: [2023-05-10 12:37:49,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:37:49,184] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 31 +16: [2023-05-10 12:37:49,184] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 133 + 0: [2023-05-10 12:37:49,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:37:49,184] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 5 +27: [2023-05-10 12:37:49,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:37:49,185] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 223 +11: [2023-05-10 12:37:49,187] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 93 + 2: [2023-05-10 12:37:49,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:37:49,188] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 133 +31: [2023-05-10 12:37:49,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:37:49,188] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 17 +31: [2023-05-10 12:37:49,188] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 253 + 0: [2023-05-10 12:37:49,189] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 5 +27: [2023-05-10 12:37:49,189] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 223 + 2: [2023-05-10 12:37:49,192] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 17 +31: [2023-05-10 12:37:49,193] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 253 +29: [2023-05-10 12:37:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:37:49,194] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 239 +17: [2023-05-10 12:37:49,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:37:49,194] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 141 +19: [2023-05-10 12:37:49,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:37:49,195] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 155 +23: [2023-05-10 12:37:49,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:37:49,197] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 185 +29: [2023-05-10 12:37:49,198] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 239 +17: [2023-05-10 12:37:49,199] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 141 +16: [2023-05-10 12:37:49,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:37:49,200] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 155 +16: [2023-05-10 12:37:49,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 129 +23: [2023-05-10 12:37:49,201] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 185 +16: [2023-05-10 12:37:49,204] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 129 + 9: [2023-05-10 12:37:49,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:37:49,205] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 73 + 2: [2023-05-10 12:37:49,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:37:49,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:37:49,206] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 159 + 2: [2023-05-10 12:37:49,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 21 + 9: [2023-05-10 12:37:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:37:49,208] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 79 +12: [2023-05-10 12:37:49,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:37:49,209] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 73 +12: [2023-05-10 12:37:49,209] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 103 + 2: [2023-05-10 12:37:49,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 21 +19: [2023-05-10 12:37:49,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 159 +25: [2023-05-10 12:37:49,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:37:49,211] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 203 + 9: [2023-05-10 12:37:49,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 79 +12: [2023-05-10 12:37:49,214] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 103 +25: [2023-05-10 12:37:49,215] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 203 +18: [2023-05-10 12:37:49,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:37:49,216] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 149 +29: [2023-05-10 12:37:49,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:37:49,219] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 235 +18: [2023-05-10 12:37:49,220] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 149 + 3: [2023-05-10 12:37:49,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:37:49,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:37:49,221] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 25 + 2: [2023-05-10 12:37:49,221] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 19 + 0: [2023-05-10 12:37:49,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:37:49,223] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 235 + 0: [2023-05-10 12:37:49,223] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 7 +21: [2023-05-10 12:37:49,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:37:49,224] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 175 + 3: [2023-05-10 12:37:49,225] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 25 +11: [2023-05-10 12:37:49,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:37:49,226] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 19 +11: [2023-05-10 12:37:49,226] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 95 +14: [2023-05-10 12:37:49,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:37:49,227] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 115 +17: [2023-05-10 12:37:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:37:49,228] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 175 +17: [2023-05-10 12:37:49,228] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 143 +16: [2023-05-10 12:37:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:37:49,228] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 135 + 7: [2023-05-10 12:37:49,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:37:49,229] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 7 + 7: [2023-05-10 12:37:49,229] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 63 +11: [2023-05-10 12:37:49,230] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 95 +14: [2023-05-10 12:37:49,231] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 115 +16: [2023-05-10 12:37:49,233] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 135 +17: [2023-05-10 12:37:49,233] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 143 + 7: [2023-05-10 12:37:49,234] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 63 + 7: [2023-05-10 12:37:49,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:37:49,236] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 61 +16: [2023-05-10 12:37:49,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:37:49,238] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 131 + 7: [2023-05-10 12:37:49,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 61 +16: [2023-05-10 12:37:49,242] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 131 + 4: [2023-05-10 12:37:49,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:37:49,243] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 35 + 8: [2023-05-10 12:37:49,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:37:49,245] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 69 +13: [2023-05-10 12:37:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:37:49,247] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 111 + 4: [2023-05-10 12:37:49,247] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 35 +29: [2023-05-10 12:37:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:37:49,247] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 237 +18: [2023-05-10 12:37:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:37:49,248] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 145 +14: [2023-05-10 12:37:49,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:37:49,249] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 113 + 8: [2023-05-10 12:37:49,249] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 69 +22: [2023-05-10 12:37:49,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:37:49,249] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 181 +13: [2023-05-10 12:37:49,251] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 111 +18: [2023-05-10 12:37:49,252] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 145 +29: [2023-05-10 12:37:49,254] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 237 +22: [2023-05-10 12:37:49,254] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 181 +14: [2023-05-10 12:37:49,255] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 113 +27: [2023-05-10 12:37:49,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:37:49,258] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 217 +21: [2023-05-10 12:37:49,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:37:49,259] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 171 +21: [2023-05-10 12:37:49,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:37:49,260] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 173 +25: [2023-05-10 12:37:49,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:37:49,260] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 207 +27: [2023-05-10 12:37:49,262] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 217 +21: [2023-05-10 12:37:49,264] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 171 +21: [2023-05-10 12:37:49,264] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 173 +25: [2023-05-10 12:37:49,265] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 207 +17: [2023-05-10 12:37:49,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:37:49,268] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 139 +19: [2023-05-10 12:37:49,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:37:49,269] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 157 +25: [2023-05-10 12:37:49,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:37:49,269] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 205 +25: [2023-05-10 12:37:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:37:49,273] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 201 +19: [2023-05-10 12:37:49,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 157 +17: [2023-05-10 12:37:49,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 139 +25: [2023-05-10 12:37:49,274] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 205 +25: [2023-05-10 12:37:49,277] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 201 +17: [2023-05-10 12:37:49,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:37:49,277] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 137 +18: [2023-05-10 12:37:49,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:37:49,281] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 151 +31: [2023-05-10 12:37:49,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:37:49,282] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 251 +17: [2023-05-10 12:37:49,282] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 137 + 7: [2023-05-10 12:37:49,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:37:49,284] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 57 +18: [2023-05-10 12:37:49,285] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 151 +31: [2023-05-10 12:37:49,286] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 251 +12: [2023-05-10 12:37:49,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:37:49,288] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 99 + 7: [2023-05-10 12:37:49,289] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 57 + 2: [2023-05-10 12:37:49,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:37:49,292] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 23 +12: [2023-05-10 12:37:49,292] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 99 +22: [2023-05-10 12:37:49,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:37:49,293] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 177 +22: [2023-05-10 12:37:49,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:37:49,295] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 179 +20: [2023-05-10 12:37:49,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:37:49,296] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 165 + 2: [2023-05-10 12:37:49,297] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 23 +22: [2023-05-10 12:37:49,299] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 177 +22: [2023-05-10 12:37:49,300] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 179 +20: [2023-05-10 12:37:49,301] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 165 +20: [2023-05-10 12:37:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:37:49,301] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 161 +20: [2023-05-10 12:37:49,305] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 161 +27: [2023-05-10 12:37:49,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:37:49,309] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 221 +27: [2023-05-10 12:37:49,313] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 221 +29: [2023-05-10 12:37:49,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:37:49,319] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 233 + 6: [2023-05-10 12:37:49,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:37:49,321] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 49 +13: [2023-05-10 12:37:49,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:37:49,322] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 105 +29: [2023-05-10 12:37:49,325] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 233 +11: [2023-05-10 12:37:49,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:37:49,325] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 49 +11: [2023-05-10 12:37:49,325] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 89 +13: [2023-05-10 12:37:49,326] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 105 +11: [2023-05-10 12:37:49,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:37:49,328] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 91 +11: [2023-05-10 12:37:49,330] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 89 + 9: [2023-05-10 12:37:49,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:37:49,331] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 77 +11: [2023-05-10 12:37:49,334] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 91 + 9: [2023-05-10 12:37:49,336] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 77 + 9: [2023-05-10 12:37:49,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:37:49,336] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 75 + 9: [2023-05-10 12:37:49,341] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 75 +20: [2023-05-10 12:37:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:37:49,342] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 167 +27: [2023-05-10 12:37:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:37:49,343] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 219 +13: [2023-05-10 12:37:49,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:37:49,344] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 109 +20: [2023-05-10 12:37:49,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 167 +27: [2023-05-10 12:37:49,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 219 + 4: [2023-05-10 12:37:49,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:37:49,347] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 39 +13: [2023-05-10 12:37:49,349] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 109 + 4: [2023-05-10 12:37:49,352] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 39 +31: [2023-05-10 12:37:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:37:49,361] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 249 +13: [2023-05-10 12:37:49,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:37:49,363] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 107 +20: [2023-05-10 12:37:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:37:49,363] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 163 +31: [2023-05-10 12:37:49,365] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 249 +13: [2023-05-10 12:37:49,367] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 107 +20: [2023-05-10 12:37:49,368] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 163 + 4: [2023-05-10 12:37:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:37:49,369] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 33 + 4: [2023-05-10 12:37:49,373] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 33 +12: [2023-05-10 12:37:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:37:49,434] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 97 +12: [2023-05-10 12:37:49,439] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 97 + 0: successfully loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity25 at iteration 0 +31: time (ms) | load-checkpoint: 12684.70 + 0: estimated model parameters: 2.81512448 + 0: estimated model parameters without embeddings: 2.6755328 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-05-10 12:37:50 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 102400 + 0: test: 102400 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.035984 seconds + 0: number of documents: 3133972 + 0: > dataset split: + 0: train: + 0: document indices in [0, 3133972) total of 3133972 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.083 seconds + 0: total number of samples: 731002 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.032576 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.111 seconds + 0: total number of samples: 169955 + 0: total number of epochs: 2 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-05-10 12:37:57 + 0: done with setup ... + 0: training ... +31: time (ms) | model-and-optimizer-setup: 30136.39 | train/valid/test-data-iterators-setup: 4325.97 + 0: [after training is done] datetime: 2023-05-10 12:37:57 +31: ----------------------------------------------------------------------------------------------------------------- +31: validation loss at the end of training for val data | lm loss value: 2.701157E+00 | lm loss PPL: 1.489695E+01 | +31: ----------------------------------------------------------------------------------------------------------------- +END 3491058: Wed 10 May 2023 12:39:39 PM EEST